# llama-server / model / llama3.py
# (HuggingFace page residue from "bigeco" — commit "Update model/llama3.py", feaeb6d verified)
import yaml
import argparse
from openai import OpenAI
# TODO 1: ํ•˜์ดํผํŒŒ๋ผ๋ฏธํ„ฐ ์กฐ์ • ํ•„์š”. (์‹คํ—˜ ํ…Œ์ŠคํŠธ ํ•„์š”)
# TODO 2: ๊ฒฐ๊ณผ๊ฐ€ ()->() ๋ฒ—์–ด๋‚  ๊ฒฝ์šฐ๋ฅผ ๋Œ€๋น„ํ•ด ์ฒ˜๋ฆฌ ์ฝ”๋“œ ์ž‘์„ฑ ํ•„์š”.
# TODO 3: ๊ฒฐ๊ณผ ์—์„œ ์ž๋ชจ ๊ธฐ์ค€์œผ๋กœ ์ž˜๋ชป ๋ฐœ์Œํ•œ ๋ถ€๋ถ„ ์ถ”์ถœ ์ฝ”๋“œ ์ž‘์„ฑ ํ•„์š”.
# TODO 4: ๋‹ค์ค‘ ์ž…๋ ฅ ์ฒ˜๋ฆฌ(batch) ์ฒ˜๋ฆฌ ๊ฐ€๋Šฅํ•˜๋„๋ก. ํŒŒ์ผ์ด๋‚˜ ๋ฆฌ์ŠคํŠธ๋กœ ์—ฌ๋Ÿฌ user_input/correct_input ๋ฐ›์•„ ์ผ๊ด„ ์ฒ˜๋ฆฌ
# TODO 5: ์ƒ์„ฑ ๊ฒฐ๊ณผ ํ‰๊ฐ€ ์ง€ํ‘œ ํ•„์š”.
import yaml
import argparse
from hangul_romanize import Transliter
from hangul_romanize.rule import academic
# TODO 1: ํ•˜์ดํผํŒŒ๋ผ๋ฏธํ„ฐ ์กฐ์ • ํ•„์š”. (์‹คํ—˜ ํ…Œ์ŠคํŠธ ํ•„์š”)
# TODO 2: ๊ฒฐ๊ณผ๊ฐ€ () -> () ๋’ท์–ด๋‚  ๊ฒฝ์šฐ๋ฅผ ๋Œ€๋น„ํ•ด ์ฒ˜๋ฆฌ ์ฝ”๋“œ ์ž‘์„ฑ ํ•„์š”.
# TODO 3: ๊ฒฐ๊ณผ ์—์„œ ์ž๋ชจ ๊ธฐ์ค€์œผ๋กœ ์ž ๋ชป ๋ฐœ์Œ๋œ ๋ถ€๋ถ„ ์ถ”์ถœ ์ฝ”๋“œ ์ž‘์„ฑ ํ•„์š”.
# TODO 4: ๋‹ค์ค‘ ์ž…๋ ฅ ์ฒ˜๋ฆฌ(batch) ์ฒ˜๋ฆฌ ๊ฐ€๋Šฅํ•˜๋„๋ก. ํŒŒ์ผ์ด๋‚˜ ๋ฆฌ์ŠคํŠธ๋กœ ์—ฌ๋Ÿฌ user_input/correct_input ๋ฐ›์•„ ์ผ๊ด„
# TODO 5: ์„ฑ์žฅ ๊ฒฐ๊ณผ ํ‰๊ฐ€ ์ง€ํ‘œ ํ•„์š”.
class LLaMA3:
    """Romanize Korean pronunciation pairs.

    Despite the name, this class does not call an LLM: it converts a
    (user_input, correct_input) pair of Korean strings into syllable-by-
    syllable hyphenated romanizations and formats them as
    "(user)->(correct)".
    """

    def __init__(self, config: dict):
        """Initialize from a parsed YAML config mapping.

        Args:
            config: Parsed configuration mapping (the code reads it via
                ``.get``, so it must be a dict-like object, not a string).
        """
        # hangul-romanize transliterator using the academic rule set.
        self.transliter = Transliter(academic)
        # Prompt template (unused here, kept to preserve the existing config schema).
        self.prompt_template = config.get("prompt_template", "")
        # Model id (unused here, kept to preserve the existing config schema).
        self.model = config.get("model", {}).get("id", "")

    def add_hyphens(self, korean_text: str) -> str:
        """Romanize each syllable of *korean_text* and join with hyphens."""
        # Iterating a str yields one syllable (character) at a time.
        return '-'.join(self.transliter.translit(ch) for ch in korean_text)

    def generate(self, user_input: str, correct_input: str) -> str:
        """Return "(user_romanized)->(correct_romanized)" for the given pair.

        Surrounding parentheses on either input, if present, are stripped
        before romanization.
        """
        user_romanized = self.add_hyphens(user_input.strip('()'))
        correct_romanized = self.add_hyphens(correct_input.strip('()'))
        return f"({user_romanized})->({correct_romanized})"
# def parse_args() -> argparse.Namespace:
# parser = argparse.ArgumentParser(description="LLaMA3 pronunciation correction pipeline.")
# parser.add_argument("--config_path", type=str, default="data/config/llama3.yaml", help="๋ชจ๋ธ ์„ค์ • ๋ฐ ํ”„๋กฌํ”„ํŠธ ์ •๋ณด๋ฅผ ๋‹ด์€ YAML ํŒŒ์ผ ๊ฒฝ๋กœ")
# parser.add_argument("--user_input", type=str, default="๋ฐ•๋ผ", help="์ž˜๋ชป ๋ฐœ์Œ๋œ ๋‹จ์–ด")
# parser.add_argument("--correct_input", type=str, default="๋ฐœ๋ผ", help="์ •ํ™•ํ•œ ๋ฐœ์Œ ๋‹จ์–ด")
# return parser.parse_args()
# def main():
# args = parse_args()
# # ์„ค์ • ํŒŒ์ผ ๋กœ๋“œ
# with open(args.config_path, "r") as f:
# config = yaml.safe_load(f)
# # ๋ชจ๋ธ ๋กœ๋“œ ๋ฐ ๊ฒฐ๊ณผ ๋ฐ˜ํ™˜
# llama3 = LLaMA3(config)
# output = llama3.generate(args.user_input, args.correct_input)
# print(output)
# if __name__ == "__main__":
# main()