# Source header recovered from web-page scrape residue (commented out so the
# file parses as Python):
#   soyailabs / add_exaone_with_token.py
#   SOY NV AI
#   feat: Parent Chunk ... (commit message garbled by encoding corruption; original Korean text unrecoverable)
#   commit d54e6a9 · raw · history · blame · 5.97 kB
"""
EXAONE-3.0-7.8B-Instruct ๋ชจ๋ธ์„ Ollama์— ์ถ”๊ฐ€ํ•˜๋Š” ์Šคํฌ๋ฆฝํŠธ (ํ† ํฐ ํฌํ•จ)
"""
import os
import subprocess
from pathlib import Path
# Hugging Face access token (placeholder -- replace before running).
# NOTE(review): committing a real token to source control is unsafe; prefer
# reading it from the environment or a secrets manager.
HF_TOKEN = "YOUR_HUGGINGFACE_TOKEN_HERE"


def set_huggingface_token():
    """Export HF_TOKEN as HUGGINGFACE_HUB_TOKEN in this process's environment.

    Child processes (and any Hugging Face libraries imported later) pick up
    this variable to authenticate gated model downloads.
    """
    os.environ['HUGGINGFACE_HUB_TOKEN'] = HF_TOKEN
    # Plain string: the original used an f-string with no placeholders.
    print("[OK] Hugging Face ํ† ํฐ ์„ค์ • ์™„๋ฃŒ")
def create_ollama_modelfile():
    """Write an Ollama Modelfile for EXAONE-3.0-7.8B-Instruct into the CWD.

    The file embeds sampling parameters, a system prompt, and the chat
    template (Go template syntax) used by the EXAONE chat format.

    Returns:
        Path: the path of the Modelfile that was written.
    """
    # Plain string literal: the original was an f-string with zero
    # substitutions, which forced every Go-template brace to be escaped as
    # `{{{{`.  A regular string emits byte-identical content and keeps the
    # template readable.
    modelfile_content = """FROM huggingface:LGAI-EXAONE/EXAONE-3.0-7.8B-Instruct
# ๋ชจ๋ธ ์„ค์ •
PARAMETER temperature 0.7
PARAMETER top_p 0.9
PARAMETER top_k 40
PARAMETER num_ctx 4096
PARAMETER num_predict 512
# ์‹œ์Šคํ…œ ํ”„๋กฌํ”„ํŠธ
SYSTEM \"\"\"You are EXAONE, a helpful AI assistant developed by LG AI Research.
You are designed to be helpful, harmless, and honest.
You can communicate in both Korean and English.\"\"\"
# EXAONE ๋ชจ๋ธ์˜ ์ฑ„ํŒ… ํ…œํ”Œ๋ฆฟ
TEMPLATE \"\"\"{{ if .System }}<|im_start|>system
{{ .System }}<|im_end|>
{{ end }}{{ if .Prompt }}<|im_start|>user
{{ .Prompt }}<|im_end|>
{{ end }}<|im_start|>assistant
{{ .Response }}<|im_end|>
\"\"\"
"""
    modelfile_path = Path("EXAONE-3.0-7.8B-Instruct.modelfile")
    modelfile_path.write_text(modelfile_content, encoding='utf-8')
    print(f"[OK] Modelfile ์ƒ์„ฑ ์™„๋ฃŒ: {modelfile_path.absolute()}")
    return modelfile_path
def create_model_with_modelfile(modelfile_path):
    """Run `ollama create` with the given Modelfile and report the outcome.

    Args:
        modelfile_path: path to the Modelfile passed via `ollama create -f`.

    Returns:
        bool: True when the command exits with status 0, False on any
        failure (non-zero exit, timeout, or unexpected error).
    """
    banner = "=" * 60
    try:
        print("\n" + banner)
        print("Ollama ๋ชจ๋ธ ์ƒ์„ฑ ์‹œ์ž‘...")
        print(banner)
        # The child inherits our environment plus the HF token so gated
        # model weights can be pulled during creation.
        child_env = dict(os.environ, HUGGINGFACE_HUB_TOKEN=HF_TOKEN)
        cmd = ['ollama', 'create', 'EXAONE-3.0-7.8B-Instruct', '-f', str(modelfile_path)]
        print(f"์‹คํ–‰ ๋ช…๋ น์–ด: {' '.join(cmd)}")
        proc = subprocess.run(
            cmd,
            env=child_env,
            capture_output=True,
            text=True,
            timeout=3600,  # one-hour ceiling: model download can be slow
        )
        if proc.returncode != 0:
            print("[ERROR] ๋ชจ๋ธ ์ƒ์„ฑ ์‹คํŒจ")
            print("์˜ค๋ฅ˜ ์ถœ๋ ฅ:")
            print(proc.stderr)
            return False
        print("[OK] ๋ชจ๋ธ ์ƒ์„ฑ ์„ฑ๊ณต!")
        print(proc.stdout)
        return True
    except subprocess.TimeoutExpired:
        print("[ERROR] ๋ชจ๋ธ ์ƒ์„ฑ ์‹œ๊ฐ„ ์ดˆ๊ณผ (1์‹œ๊ฐ„)")
        return False
    except Exception as e:
        print(f"[ERROR] ์˜ค๋ฅ˜ ๋ฐœ์ƒ: {e}")
        return False
def check_ollama_installation():
    """Return True when the `ollama` CLI is on PATH and answers --version."""
    try:
        proc = subprocess.run(
            ['ollama', '--version'],
            capture_output=True,
            text=True,
            timeout=5,
        )
    except FileNotFoundError:
        # Binary not on PATH at all: point the user at the installer.
        print("[ERROR] Ollama๊ฐ€ ์„ค์น˜๋˜์–ด ์žˆ์ง€ ์•Š์Šต๋‹ˆ๋‹ค.")
        print(" ์„ค์น˜ ๋ฐฉ๋ฒ•: https://ollama.ai/download")
        return False
    except Exception as e:
        print(f"[ERROR] Ollama ํ™•์ธ ์ค‘ ์˜ค๋ฅ˜: {e}")
        return False
    if proc.returncode != 0:
        print("[ERROR] Ollama๊ฐ€ ์„ค์น˜๋˜์–ด ์žˆ์ง€ ์•Š์Šต๋‹ˆ๋‹ค.")
        return False
    print(f"[OK] Ollama ์„ค์น˜ ํ™•์ธ: {proc.stdout.strip()}")
    return True
def verify_model():
    """Check `ollama list` output for the newly created EXAONE model.

    Returns:
        bool: True when 'EXAONE-3.0-7.8B-Instruct' appears in the installed
        model list; False when it is absent, the command exits non-zero, or
        the command itself fails.
    """
    try:
        listing = subprocess.run(['ollama', 'list'],
                                 capture_output=True, text=True, timeout=5)
        if listing.returncode == 0:
            if 'EXAONE-3.0-7.8B-Instruct' in listing.stdout:
                print("\n[OK] ๋ชจ๋ธ์ด ์„ฑ๊ณต์ ์œผ๋กœ ์ถ”๊ฐ€๋˜์—ˆ์Šต๋‹ˆ๋‹ค!")
                print("\n์„ค์น˜๋œ ๋ชจ๋ธ ๋ชฉ๋ก:")
                print(listing.stdout)
                return True
            print("\n[WARNING] ๋ชจ๋ธ์ด ๋ชฉ๋ก์— ๋‚˜ํƒ€๋‚˜์ง€ ์•Š์Šต๋‹ˆ๋‹ค.")
            print("\nํ˜„์žฌ ์„ค์น˜๋œ ๋ชจ๋ธ:")
            print(listing.stdout)
        # Missing from the list, or `ollama list` exited non-zero.
        return False
    except Exception as e:
        print(f"[WARNING] ๋ชจ๋ธ ํ™•์ธ ์ค‘ ์˜ค๋ฅ˜: {e}")
        return False
def _main():
    """Script entry point: verify prerequisites, then build the Ollama model."""
    print("\n" + "=" * 60)
    print("EXAONE-3.0-7.8B-Instruct Ollama ์ถ”๊ฐ€ ์Šคํฌ๋ฆฝํŠธ")
    print("=" * 60 + "\n")
    # Abort early when the ollama CLI is missing.
    if not check_ollama_installation():
        print("\n[WARNING] Ollama๋ฅผ ๋จผ์ € ์„ค์น˜ํ•ด์ฃผ์„ธ์š”.")
        exit(1)
    # Authenticate, then materialize the Modelfile on disk.
    set_huggingface_token()
    modelfile_path = create_ollama_modelfile()
    # Warn about the heavy download before kicking it off.
    print("\n[WARNING] ์ฃผ์˜์‚ฌํ•ญ:")
    print("- ๋ชจ๋ธ ํฌ๊ธฐ๊ฐ€ ์•ฝ 15GB์ด๋ฏ€๋กœ ๋‹ค์šด๋กœ๋“œ์— ์‹œ๊ฐ„์ด ๊ฑธ๋ฆด ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.")
    print("- ์ถฉ๋ถ„ํ•œ ๋””์Šคํฌ ๊ณต๊ฐ„๊ณผ GPU ๋ฉ”๋ชจ๋ฆฌ๊ฐ€ ํ•„์š”ํ•ฉ๋‹ˆ๋‹ค.")
    print("- Hugging Face์—์„œ ๋ชจ๋ธ ์•ก์„ธ์Šค ๊ถŒํ•œ์ด ํ•„์š”ํ•ฉ๋‹ˆ๋‹ค.")
    print("\n๋ชจ๋ธ ์ƒ์„ฑ์„ ์‹œ์ž‘ํ•ฉ๋‹ˆ๋‹ค...")
    if create_model_with_modelfile(modelfile_path):
        verify_model()
        print("\n" + "=" * 60)
        print("[OK] ๋ชจ๋ธ ์ถ”๊ฐ€ ์™„๋ฃŒ!")
        print("=" * 60)
        print("\n์ด์ œ ์›น ์• ํ”Œ๋ฆฌ์ผ€์ด์…˜์—์„œ ๋ชจ๋ธ์„ ์‚ฌ์šฉํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.")
        print("๋ชจ๋ธ ํ…Œ์ŠคํŠธ:")
        print(" ollama run EXAONE-3.0-7.8B-Instruct \"์•ˆ๋…•ํ•˜์„ธ์š”\"")
        print("=" * 60)
    else:
        # Creation failed: show the manual recovery steps (PowerShell syntax).
        print("\n" + "=" * 60)
        print("[ERROR] ๋ชจ๋ธ ์ƒ์„ฑ ์‹คํŒจ")
        print("=" * 60)
        print("\n์ˆ˜๋™์œผ๋กœ ๋ชจ๋ธ์„ ์ƒ์„ฑํ•˜๋ ค๋ฉด:")
        print(" 1. Hugging Face ํ† ํฐ ์„ค์ •:")
        print(f" $env:HUGGINGFACE_HUB_TOKEN='{HF_TOKEN}'")
        print(" 2. Modelfile๋กœ ๋ชจ๋ธ ์ƒ์„ฑ:")
        print(f" ollama create EXAONE-3.0-7.8B-Instruct -f {modelfile_path}")
        print("=" * 60)


if __name__ == "__main__":
    _main()