Dongjin1203 committed on
Commit
b3d3fe8
·
1 Parent(s): 3920e00

Add Base model GGUF support

Browse files
Files changed (2) hide show
  1. src/compare_models.py +4 -4
  2. src/utils/config.py +1 -1
src/compare_models.py CHANGED
@@ -77,10 +77,10 @@ class ModelComparison:
77
  logger.info("✅ QLoRA 단독 로드 완료")
78
 
79
  # 3. Base + RAG (PEFT 제거) - TODO: GGUF 변환 후 추가
80
- # logger.info("\n[3/3] Base + RAG 모델 로딩...")
81
- # from src.generator.generator_gguf_base import GGUFBaseRAGPipeline
82
- # self.pipelines['base_rag'] = GGUFBaseRAGPipeline(config=self.config)
83
- # logger.info("✅ Base + RAG 로드 완료")
84
  logger.warning("\n⚠️ Base + RAG 스킵: Base 모델 GGUF 변환 후 추가 예정")
85
 
86
  except Exception as e:
 
77
  logger.info("✅ QLoRA 단독 로드 완료")
78
 
79
  # 3. Base + RAG (PEFT 제거) - TODO: GGUF 변환 후 추가
80
+ logger.info("\n[3/3] Base + RAG 모델 로딩...")
81
+ from src.generator.generator_gguf_base import GGUFBaseRAGPipeline
82
+ self.pipelines['base_rag'] = GGUFBaseRAGPipeline(config=self.config)
83
+ logger.info("✅ Base + RAG 로드 완료")
84
  logger.warning("\n⚠️ Base + RAG 스킵: Base 모델 GGUF 변환 후 추가 예정")
85
 
86
  except Exception as e:
src/utils/config.py CHANGED
@@ -71,7 +71,7 @@ class Config:
71
  # 2. Base 모델 (PEFT 없음) - 비교 실험용
72
  self.BASE_MODEL_HUB_REPO = os.getenv(
73
  "BASE_MODEL_HUB_REPO",
74
- "beomi/Llama-3-Open-Ko-8B-gguf"
75
  )
76
  self.BASE_MODEL_HUB_FILENAME = os.getenv(
77
  "BASE_MODEL_HUB_FILENAME",
 
71
  # 2. Base 모델 (PEFT 없음) - 비교 실험용
72
  self.BASE_MODEL_HUB_REPO = os.getenv(
73
  "BASE_MODEL_HUB_REPO",
74
+ "Llama-3-Open-Ko-8B-Q4_K_M.gguf"
75
  )
76
  self.BASE_MODEL_HUB_FILENAME = os.getenv(
77
  "BASE_MODEL_HUB_FILENAME",