Upload MLP.py
Browse files
MLP.py
ADDED
|
@@ -0,0 +1,69 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import numpy as np
|
| 2 |
+
|
| 3 |
+
# --- Hyperparameters ----------------------------------------------------
input_size = 2        # neurons in the input layer
hidden_size = 3       # neurons in the hidden layer
output_size = 1       # neurons in the output layer
learning_rate = 0.5   # step size for the gradient updates
epochs = 10000        # number of full-batch training iterations

# --- 1. Dataset: the classic XOR problem --------------------------------
# Inputs are all four binary pairs; the target is their exclusive-or.
X = np.array([[0, 0],
              [0, 1],
              [1, 0],
              [1, 1]])
y = np.array([[0],
              [1],
              [1],
              [0]])

# --- 2. Weight and bias initialization (standard normal draws) ----------
W1 = np.random.randn(input_size, hidden_size)   # input -> hidden weights
b1 = np.random.randn(hidden_size)               # hidden-layer bias
W2 = np.random.randn(hidden_size, output_size)  # hidden -> output weights
b2 = np.random.randn(output_size)               # output-layer bias
|
| 21 |
+
|
| 22 |
+
# 3. Activation function
def sigmoid(x):
    """Logistic sigmoid activation: squashes any real input into (0, 1)."""
    return 1.0 / (np.exp(-x) + 1.0)
|
| 25 |
+
|
| 26 |
+
def sigmoid_derivative(x):
    """Derivative of the sigmoid, where *x* is already a sigmoid OUTPUT.

    For s = sigmoid(z), ds/dz = s * (1 - s); callers pass s, not z.
    """
    return (1 - x) * x
|
| 28 |
+
|
| 29 |
+
# 4. Training loop: full-batch gradient descent with manual backpropagation
for epoch in range(epochs):
    # Forward pass: input -> hidden -> output
    hidden_act = sigmoid(np.dot(X, W1) + b1)
    prediction = sigmoid(np.dot(hidden_act, W2) + b2)

    # Backward pass, step 1: output-layer error and local gradient
    out_error = y - prediction
    out_delta = out_error * sigmoid_derivative(prediction)

    # Step 2: propagate the output delta back through W2 to the hidden layer
    hid_error = np.dot(out_delta, W2.T)
    hid_delta = hid_error * sigmoid_derivative(hidden_act)

    # Step 3: parameter updates (+= is descent on the loss, since
    # out_error is defined as target minus prediction)
    W2 += np.dot(hidden_act.T, out_delta) * learning_rate
    b2 += out_delta.sum(axis=0) * learning_rate
    W1 += np.dot(X.T, hid_delta) * learning_rate
    b1 += hid_delta.sum(axis=0) * learning_rate

    # Progress report every 1000th epoch (mean absolute error)
    if epoch % 1000 == 0:
        print(f"Epoch: {epoch}, Loss: {np.mean(np.abs(out_error)):.4f}")
|
| 59 |
+
|
| 60 |
+
# Defect fixed: the user-facing print strings were mojibake-corrupted
# (mis-encoded Korean text); restored to readable output text.
print("\n--- Training complete ---")

# 5. Evaluate the trained model on the training inputs (result check)
hidden_output_final = np.dot(X, W1) + b1
hidden_activation_final = sigmoid(hidden_output_final)
predicted_final = sigmoid(np.dot(hidden_activation_final, W2) + b2)

print("Input data:\n", X)
# Round the sigmoid outputs to hard 0/1 class labels for display.
print("Predicted labels:\n", predicted_final.round())
print("True labels:\n", y)
|