|
|
import numpy as np
|
|
|
|
|
|
|
|
|
# Network architecture: 2 inputs -> 3 hidden units -> 1 output (sized for XOR).
input_size = 2

hidden_size = 3

output_size = 1

# Gradient-descent step size used in the weight/bias updates below.
learning_rate = 0.5

# Number of full-batch passes over the four XOR examples.
epochs = 10000
|
|
|
|
|
|
|
|
|
|
|
|
# XOR truth table: the four possible binary input pairs, shape (4, 2).
X = np.array([[0, 0], [0, 1], [1, 0], [1, 1]])

# XOR targets for each row of X, shape (4, 1).
y = np.array([[0], [1], [1], [0]])
|
|
|
|
|
|
|
|
|
# Initialize all parameters from a standard normal distribution.
# NOTE(review): no np.random.seed is set, so every run starts from different
# weights and may converge differently — confirm this is intended.
W1 = np.random.randn(input_size, hidden_size)   # input->hidden weights, (2, 3)

b1 = np.random.randn(hidden_size)               # hidden biases, (3,)

W2 = np.random.randn(hidden_size, output_size)  # hidden->output weights, (3, 1)

b2 = np.random.randn(output_size)               # output bias, (1,)
|
|
|
|
|
|
|
|
|
def sigmoid(x):
    """Element-wise logistic function, squashing inputs into (0, 1)."""
    decay = np.exp(-x)
    return np.reciprocal(1.0 + decay)
|
|
|
|
|
|
def sigmoid_derivative(x):
    """Sigmoid gradient expressed through its output value s: s * (1 - s).

    Note the argument is assumed to already be a sigmoid *activation*,
    not a pre-activation input.
    """
    s = x
    return np.multiply(s, 1 - s)
|
|
|
|
|
|
|
|
|
# Train the 2-3-1 network with full-batch gradient descent on all four
# XOR examples at once.
for epoch in range(epochs):

    # --- Forward pass ---
    # Hidden layer pre-activation and activation, shape (4, 3).
    hidden_output = np.dot(X, W1) + b1

    hidden_activation = sigmoid(hidden_output)

    # Output layer pre-activation and prediction, shape (4, 1).
    output_output = np.dot(hidden_activation, W2) + b2

    predicted_output = sigmoid(output_output)

    # --- Backward pass ---
    # Output error (target - prediction) and its delta through the
    # sigmoid; sigmoid_derivative takes the activation itself.
    error_output = y - predicted_output

    delta_output = error_output * sigmoid_derivative(predicted_output)

    # Propagate the output delta back through W2 to the hidden layer.
    error_hidden = np.dot(delta_output, W2.T)

    delta_hidden = error_hidden * sigmoid_derivative(hidden_activation)

    # --- Parameter updates ---
    # `+=` is correct here because error is (target - prediction), which
    # already carries the negative sign of the loss gradient.
    W2 += np.dot(hidden_activation.T, delta_output) * learning_rate

    b2 += np.sum(delta_output, axis=0) * learning_rate

    W1 += np.dot(X.T, delta_hidden) * learning_rate

    b1 += np.sum(delta_hidden, axis=0) * learning_rate

    # Periodically report the mean absolute error over the batch.
    if epoch % 1000 == 0:

        loss = np.mean(np.abs(error_output))

        print(f"Epoch: {epoch}, Loss: {loss:.4f}")
|
|
|
|
|
|
# --- Final evaluation with the trained parameters ---
# Fixes: the original string at the "input data" print was split across two
# source lines (a SyntaxError), and the Korean labels were mojibake'd;
# reconstructed here ("학습 완료" = training complete, "입력 데이터" = input
# data, "예측 결과" = prediction result, "정답 레이블" = ground-truth label).
print("\n--- 학습 완료 ---")

# One last forward pass through both layers.
hidden_output_final = np.dot(X, W1) + b1

hidden_activation_final = sigmoid(hidden_output_final)

predicted_final = sigmoid(np.dot(hidden_activation_final, W2) + b2)

print("입력 데이터:\n", X)

# round() maps the sigmoid outputs to hard 0/1 class decisions.
print("예측 결과:\n", predicted_final.round())

print("정답 레이블:\n", y)