Spaces:

hyungjoochae
/

chat-and-answer-completion

Sleeping

chat-and-answer-completion / guide_generation /test.py

2b267d0 6 months ago

7.43 kB

	import os
	import random
	import datetime
	import json
	import multiprocessing
	import sys
	from tqdm import tqdm

	# Add the parent directory to sys.path so that utils.py can be imported
	sys.path.append(os.path.abspath(os.path.join(os.path.dirname(__file__), '..')))
	from utils import track_api_cost
	from llm_functions import generate_guide

	# Load environment variables from a .env file for testing, when available.
	# python-dotenv is optional: only the import itself is guarded, so a
	# failure inside load_dotenv() is not silently mistaken for a missing package.
	try:
	    from dotenv import load_dotenv
	except ImportError:
	    pass
	else:
	    load_dotenv()

	# Example data from which main() randomly samples test cases.
	example_companies = [
	    "삼성전자",
	    "카카오",
	    "네이버",
	    "쿠팡",
	    "토스",
	    "현대자동차",
	    "CJ제일제당",
	    "하이브",
	]

	# Job title -> job description (JD) text.
	example_jobs_jds = {
	    "백엔드 개발자": (
	        "Spring Boot, JPA, MySQL 경험자. "
	        "MSA 환경 경험 우대. "
	        "클라우드(AWS) 환경 배포 및 운영 경험자."
	    ),
	    "프론트엔드 개발자": (
	        "React, TypeScript, Redux 사용. "
	        "반응형 웹 개발 경험 필수. "
	        "UI/UX에 대한 이해도가 높은 분."
	    ),
	    "데이터 분석가": (
	        "SQL, Python(Pandas, Scikit-learn) 활용 능력. "
	        "통계적 지식과 데이터 시각화(Tableau 등) 능력."
	    ),
	    "프로덕트 매니저(PM)": (
	        "IT 프로덕트 기획 및 관리 경험. "
	        "사용자 스토리 작성, 백로그 관리. "
	        "데이터 기반 의사결정 능력."
	    ),
	    "마케터": (
	        "디지털 마케팅(SA, DA, SEO) 경험. "
	        "콘텐츠 기획 및 제작, 성과 분석. "
	        "SNS 채널 운영 경험."
	    ),
	}

	# Question type -> question template. Templates may contain the
	# {company_name} and {job_title} placeholders, filled in via str.format().
	example_questions = {
	    "지원동기": "{company_name}에 지원한 동기에 대해 기술해주십시오.",
	    "성장과정": (
	        "본인의 성장과정을 간략히 기술하되 "
	        "현재의 자신에게 가장 큰 영향을 끼친 사건, 인물 등을 포함하여 기술해주십시오."
	    ),
	    "직무역량": (
	        "{job_title} 직무 수행에 필요한 역량은 무엇이라고 생각하며, "
	        "이를 갖추기 위해 어떤 노력을 해왔는지 기술해주십시오."
	    ),
	    "입사후포부": "입사 후 10년 동안의 회사생활 시나리오와 그것을 추구하는 이유를 기술해주십시오.",
	}

	experience_levels = ["신입", "경력", "인턴"]

	# Run configuration.
	NUM_TESTS = 100            # number of randomly generated test cases
	NUM_PROCESSES = 10         # size of the multiprocessing worker pool
	MODEL_NAME = "gpt-4o-mini"  # model name passed to track_api_cost

	def run_test(test_input_with_id):
	    """Run one guide-generation test case; worker function for the process pool.

	    Args:
	        test_input_with_id: ``(test_id, test_input)`` tuple. ``test_input`` is
	            the dict of keyword arguments forwarded to ``generate_guide``.

	    Returns:
	        A dict with the keys ``id``, ``input``, ``parsed_result``, ``error``,
	        ``cost`` and ``status``. ``status`` is "✅ Success", "❌ Failure"
	        (empty result or a result carrying an "error" key) or "❌ Error"
	        (an exception was raised while generating or costing the guide).
	    """
	    test_id, test_input = test_input_with_id
	    total_cost = 0

	    try:
	        parsed_guide, response = generate_guide(**test_input)

	        if response and hasattr(response, 'usage'):
	            total_cost = track_api_cost(response, MODEL_NAME, None)

	        status = "✅ Success"
	        error_message = ""
	        # Check emptiness first: testing `"error" in parsed_guide` on None
	        # would raise TypeError and misreport a plain failure as an exception.
	        if not parsed_guide:
	            status = "❌ Failure"
	            error_message = "Unknown failure"
	        elif isinstance(parsed_guide, dict) and "error" in parsed_guide:
	            status = "❌ Failure"
	            error_message = str(parsed_guide["error"])

	        return {
	            "id": test_id,
	            "input": test_input,
	            # Keep the report schema uniform when no result came back at all.
	            "parsed_result": {} if parsed_guide is None else parsed_guide,
	            "error": error_message,
	            "cost": total_cost,
	            "status": status,
	        }
	    except Exception as e:
	        # Worker boundary: one failing case must not abort the whole run, so
	        # the exception is recorded in the result instead of propagating.
	        # total_cost keeps whatever was tracked before the failure.
	        return {
	            "id": test_id,
	            "input": test_input,
	            "parsed_result": {},
	            "error": f"Exception: {str(e)}",
	            "cost": total_cost,
	            "status": "❌ Error"
	        }

	def _build_test_inputs(num_tests):
	    """Return ``num_tests`` randomly sampled ``(test_id, kwargs)`` pairs; ids start at 1."""
	    jobs = list(example_jobs_jds.items())
	    question_templates = list(example_questions.values())

	    test_inputs = []
	    for test_id in range(1, num_tests + 1):
	        company = random.choice(example_companies)
	        job_title, jd = random.choice(jobs)
	        question_template = random.choice(question_templates)
	        question = question_template.format(company_name=company, job_title=job_title)
	        experience = random.choice(experience_levels)

	        test_inputs.append((test_id, {
	            "company_name": company,
	            "jd": jd,
	            "question": question,
	            "experience_level": experience,
	        }))
	    return test_inputs


	def _render_table_row(res):
	    """Render one result dict from ``run_test`` as an HTML ``<tr>``, escaping dynamic text."""
	    from html import escape

	    def pre_json(value):
	        # default=str is deliberate: this is a human-readable report, and one
	        # non-serializable value must not abort the report after a full run.
	        dumped = json.dumps(value, indent=2, ensure_ascii=False, default=str)
	        return f"<pre>{escape(dumped, quote=False)}</pre>"

	    status_class = "status-success" if "Success" in res["status"] else "status-failure"
	    cells = [
	        f"<td>{res['id']}</td>",
	        f"<td>{pre_json(res['input'])}</td>",
	        f"<td>{pre_json(res['parsed_result'])}</td>",
	        # Error text and model output may contain '<' or '&'; escape them so
	        # they are displayed verbatim instead of being parsed as markup.
	        f"<td><pre>{escape(str(res['error']), quote=False)}</pre></td>",
	        f"<td>${res['cost']:.6f}</td>",
	        f'<td class="{status_class}">{escape(res["status"], quote=False)}</td>',
	    ]
	    return "\n<tr>\n" + "\n".join(cells) + "\n</tr>\n"


	def main():
	    """Prepare the test cases, run them in parallel and write an HTML report.

	    Builds ``NUM_TESTS`` random inputs, runs ``run_test`` over them in a pool
	    of ``NUM_PROCESSES`` worker processes, then writes a timestamped
	    ``guide_generation_report_*.html`` file into the current working
	    directory and prints the total estimated cost.
	    """
	    print(f"총 {NUM_TESTS}개의 테스트를 {NUM_PROCESSES}개 프로세스로 병렬 실행합니다...")

	    test_inputs = _build_test_inputs(NUM_TESTS)

	    results = []
	    with multiprocessing.Pool(processes=NUM_PROCESSES) as pool:
	        with tqdm(total=NUM_TESTS, desc="가이드 생성 테스트") as pbar:
	            # imap_unordered yields results as they finish, which keeps the
	            # progress bar live; order is restored by the sort below.
	            for result in pool.imap_unordered(run_test, test_inputs):
	                results.append(result)
	                pbar.update()

	    results.sort(key=lambda x: x['id'])
	    print("모든 테스트가 완료되었습니다.")

	    now = datetime.datetime.now()
	    report_filename = f"guide_generation_report_{now.strftime('%Y%m%d_%H%M%S')}.html"

	    failure_count = sum(1 for r in results if "Success" not in r["status"])
	    total_cost = sum(r['cost'] for r in results)
	    failure_rate = (failure_count / NUM_TESTS) * 100 if NUM_TESTS > 0 else 0

	    # Literal CSS braces are doubled because the template goes through str.format().
	    html_template = """
	<!DOCTYPE html><html lang="ko"><head><meta charset="UTF-8"><title>가이드 생성 테스트 보고서</title>
	<style>body{{font-family:sans-serif;margin:20px;}} h1,h2{{text-align:center;}} .summary{{border:1px solid #ddd;padding:20px;margin-bottom:20px;}} table{{width:100%;border-collapse:collapse;}} th,td{{border:1px solid #ddd;padding:8px;text-align:left;vertical-align:top;}} th{{background-color:#f2f2f2;}} .status-success{{color:green;font-weight:bold;}} .status-failure{{color:red;font-weight:bold;}} pre{{white-space:pre-wrap;word-wrap:break-word;background-color:#f9f9f9;padding:10px;border:1px solid #ddd;}} .container{{max-width:1400px;margin:auto;}}</style>
	</head><body><div class="container"><h1>가이드 생성 테스트 보고서</h1><div class="summary"><h2>요약</h2><p><strong>테스트 시간:</strong> {now}</p><p><strong>총 테스트 수:</strong> {total_tests}</p><p><strong>성공:</strong> {success_count}</p><p><strong>실패/에러:</strong> {failure_count}</p><p><strong>실패율:</strong> <span class="{status_class}">{failure_rate:.2f}%</span></p><p><strong>총 예상 비용:</strong> ${total_cost:.6f}</p></div>
	<h2>상세 결과</h2><table><thead><tr><th>ID</th><th>입력 (Input)</th><th>파싱 결과 (Parsed)</th><th>에러</th><th>비용</th><th>상태</th></tr></thead><tbody>{table_rows}</tbody></table></div></body></html>
	"""

	    table_rows_html = "".join(_render_table_row(res) for res in results)

	    final_html = html_template.format(
	        now=now.strftime('%Y-%m-%d %H:%M:%S'),
	        total_tests=NUM_TESTS,
	        success_count=NUM_TESTS - failure_count,
	        failure_count=failure_count,
	        # The summary is shown as a success while fewer than 10% of cases failed.
	        status_class="status-success" if failure_rate < 10 else "status-failure",
	        failure_rate=failure_rate,
	        total_cost=total_cost,
	        table_rows=table_rows_html
	    )

	    with open(report_filename, "w", encoding="utf-8") as f:
	        f.write(final_html)

	    print(f"'{report_filename}' 파일로 보고서가 저장되었습니다.")
	    print(f"총 예상 비용: ${total_cost:.6f}")

	# Run the test suite only when executed as a script. The guard also keeps
	# main() from re-running if a multiprocessing worker re-imports this module
	# (relevant for the "spawn" start method).
	if __name__ == "__main__":
	    main()