feat: drop unused presets (qwen2.5-1.5b, qwen3-1.7b)
Browse files
- src/kpaa/llm/presets.py +0 -18
src/kpaa/llm/presets.py
CHANGED
|
@@ -50,15 +50,6 @@ PRESETS: list[ModelPreset] = [
|
|
| 50 |
hf_repo="google/gemma-4-E2B-it",
|
| 51 |
family="gemma",
|
| 52 |
),
|
| 53 |
-
ModelPreset(
|
| 54 |
-
id="qwen2.5-1.5b",
|
| 55 |
-
label="Qwen2.5 1.5B Instruct (가장 빠름)",
|
| 56 |
-
short="1.5B · 토큰 속도 최우선 · 한국어 톤은 다소 뻣뻣",
|
| 57 |
-
llama_cpp_repo="bartowski/Qwen2.5-1.5B-Instruct-GGUF",
|
| 58 |
-
llama_cpp_file="Qwen2.5-1.5B-Instruct-Q4_K_M.gguf",
|
| 59 |
-
hf_repo="Qwen/Qwen2.5-1.5B-Instruct",
|
| 60 |
-
family="qwen2.5",
|
| 61 |
-
),
|
| 62 |
ModelPreset(
|
| 63 |
id="qwen2.5-3b",
|
| 64 |
label="Qwen2.5 3B Instruct (빠름·안정)",
|
|
@@ -68,15 +59,6 @@ PRESETS: list[ModelPreset] = [
|
|
| 68 |
hf_repo="Qwen/Qwen2.5-3B-Instruct",
|
| 69 |
family="qwen2.5",
|
| 70 |
),
|
| 71 |
-
ModelPreset(
|
| 72 |
-
id="qwen3-1.7b",
|
| 73 |
-
label="Qwen3 1.7B (최신·빠름)",
|
| 74 |
-
short="1.7B · 최신 세대 · 다국어 토크나이저 개선",
|
| 75 |
-
llama_cpp_repo="bartowski/Qwen_Qwen3-1.7B-GGUF",
|
| 76 |
-
llama_cpp_file="Qwen_Qwen3-1.7B-Q4_K_M.gguf",
|
| 77 |
-
hf_repo="Qwen/Qwen3-1.7B",
|
| 78 |
-
family="qwen3",
|
| 79 |
-
),
|
| 80 |
ModelPreset(
|
| 81 |
id="qwen3-4b-instruct-2507",
|
| 82 |
label="Qwen3 4B Instruct 2507 (큰 모델·non-thinking)",
|
|
|
|
| 50 |
hf_repo="google/gemma-4-E2B-it",
|
| 51 |
family="gemma",
|
| 52 |
),
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 53 |
ModelPreset(
|
| 54 |
id="qwen2.5-3b",
|
| 55 |
label="Qwen2.5 3B Instruct (빠름·안정)",
|
|
|
|
| 59 |
hf_repo="Qwen/Qwen2.5-3B-Instruct",
|
| 60 |
family="qwen2.5",
|
| 61 |
),
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 62 |
ModelPreset(
|
| 63 |
id="qwen3-4b-instruct-2507",
|
| 64 |
label="Qwen3 4B Instruct 2507 (큰 모델·non-thinking)",
|