File size: 4,062 Bytes
9a7964b
 
 
 
59e2c8a
 
1706cd9
727cb75
 
9a7964b
 
b16996a
 
 
 
 
f409660
b16996a
727cb75
 
 
 
bd75839
727cb75
 
 
 
9a7964b
b16996a
9a7964b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
59e2c8a
 
 
 
 
 
 
 
 
 
 
 
 
9939b9d
727cb75
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
aac5f23
 
 
 
 
 
 
 
 
 
 
 
 
 
9939b9d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
# Model preset registry for dev and Hugging Face Space.
# Select active preset with ACTIVE_MODEL; override any field via .env (see .env.example).

# Registry-wide settings; each can be overridden from the environment / .env.
defaults:
  # Preset used unless ACTIVE_MODEL overrides it. The value names a key under
  # `models:` (NOTE(review): that it *must* match a key is assumed from the
  # registry layout — confirm in the loader).
  # Commented-out alternative:
  # active_model: minicpm-v-4.6
  active_model: minicpm5-1b

  # Default true for local dev (dropdown in Gradio). Space: set ALLOW_MODEL_SWITCH=false.
  allow_model_switch: true

models:
  # Multimodal MiniCPM-V 4.6 preset, loaded through the transformers backend.
  # This is not the preset selected by `defaults.active_model`, so the label
  # carries no "default" tag.
  minicpm-v-4.6:
    label: MiniCPM-V 4.6 (Transformers, ~0.8B)
    backend: transformers
    model_id: openbmb/MiniCPM-V-4.6
    # NOTE(review): presumably forwarded to Transformers' from_pretrained, in
    # which case Python code shipped in the model repo is executed — confirm.
    trust_remote_code: true
    multimodal: true

  # GGUF variant of MiniCPM-V 4.6, served through the llama_cpp backend.
  minicpm-v-4.6-gguf:
    label: MiniCPM-V 4.6 (GGUF / llama.cpp)
    backend: llama_cpp
    # llama_cpp presets identify weights by repo + file name instead of model_id.
    model_repo: openbmb/MiniCPM-V-4.6-gguf
    model_file: MiniCPM-V-4_6-Q4_K_M.gguf
    multimodal: true
    # Presumably the context length in tokens handed to llama.cpp — confirm.
    n_ctx: 8192
    # Presumably the number of layers offloaded to the GPU (0 = CPU only in
    # llama.cpp terms) — confirm the loader passes it through unchanged.
    n_gpu_layers: 0

  # Qwen 2.5 3B Instruct as a GGUF file, served through the llama_cpp backend.
  # No `multimodal` key is set on this preset.
  qwen3b-gguf:
    label: Qwen 2.5 3B Instruct (GGUF)
    backend: llama_cpp
    # Weights are identified by repo + file name.
    model_repo: Qwen/Qwen2.5-3B-Instruct-GGUF
    model_file: qwen2.5-3b-instruct-q4_k_m.gguf
    # Presumably the context length in tokens — confirm against the loader.
    n_ctx: 4096
    # Presumably GPU-offloaded layer count (0 = CPU only in llama.cpp) — confirm.
    n_gpu_layers: 0

  # Llama 3.2 3B Instruct as a GGUF file, served through the llama_cpp backend.
  # No `multimodal` key is set on this preset.
  llama32-3b-gguf:
    label: Llama 3.2 3B Instruct (GGUF)
    backend: llama_cpp
    # Weights come from a third-party (bartowski) GGUF repo, selected by file name.
    model_repo: bartowski/Llama-3.2-3B-Instruct-GGUF
    model_file: Llama-3.2-3B-Instruct-Q4_K_M.gguf
    # Presumably the context length in tokens — confirm against the loader.
    n_ctx: 4096
    # Presumably GPU-offloaded layer count (0 = CPU only in llama.cpp) — confirm.
    n_gpu_layers: 0

  # Base MiniCPM5 1B preset (no adapter). This is the key currently named by
  # `defaults.active_model`, and the base model the LoRA presets build on.
  minicpm5-1b:
    label: MiniCPM5 1B (Transformers)
    backend: transformers
    model_id: openbmb/MiniCPM5-1B
    # NOTE(review): presumably forwarded to Transformers' from_pretrained, in
    # which case Python code shipped in the model repo is executed — confirm.
    trust_remote_code: true

  # Gemma 4 E2B instruction-tuned QAT "mobile" checkpoint, transformers backend.
  gemma4-e2b-mobile:
    label: Gemma 4 E2B IT QAT Mobile (Transformers)
    backend: transformers
    model_id: google/gemma-4-E2B-it-qat-mobile-transformers
    # NOTE(review): confirm this repo actually needs trust_remote_code; if the
    # stock Transformers classes load it, dropping the flag avoids running
    # repo-supplied code.
    trust_remote_code: true

  # Fine-tuned model with weights already merged, read from a local directory.
  # The relative path is presumably resolved against the process working
  # directory — confirm where the app is launched from.
  gemma-merged-local:
    label: Fine-tuned merged model (local path)
    backend: transformers
    model_id: ./gemma_merged_model

  # Fine-tuned LoRA adapter read from a local directory.
  # NOTE(review): the adapter directory is given as `model_id` with no
  # `adapter_path`, unlike the minicpm5 LoRA presets in this file, which pair a
  # base `model_id` with `adapter_path`. Confirm the loader can resolve the base
  # model from an adapter directory passed this way.
  gemma-lora-local:
    label: Fine-tuned LoRA adapter (local path)
    backend: transformers
    model_id: ./gemma_finetuned_model

  # MiniCPM5 1B base model plus a "lesson" LoRA adapter stored on local disk.
  minicpm5-1b-lesson-lora:
    label: MiniCPM5 1B lesson LoRA (local)
    backend: transformers
    # Base weights come from the Hub; only the adapter is local.
    model_id: openbmb/MiniCPM5-1B
    # Relative path — presumably resolved against the working directory (confirm).
    adapter_path: ./models/finetuned/minicpm5-1b-lora
    # NOTE(review): presumably forwarded to Transformers' from_pretrained — confirm.
    trust_remote_code: true

  # "Lesson" fine-tune of MiniCPM5 1B with the adapter merged into the weights,
  # read from a local directory (hence no adapter_path).
  minicpm5-1b-lesson-merged:
    label: MiniCPM5 1B lesson merged (local)
    backend: transformers
    # Relative path — presumably resolved against the working directory (confirm).
    model_id: ./models/finetuned/minicpm5-1b-lora-merged
    # NOTE(review): presumably forwarded to Transformers' from_pretrained — confirm.
    trust_remote_code: true

  # Well-Tuned track: base MiniCPM5-1B + a Modal-published LoRA adapter pulled
  # straight from the Hub (no local files needed). These point at the repos the
  # finetune pipeline publishes once a job clears its lm-eval gate
  # (research/modal/experiments.yaml -> publish.hub_repo).
  # MiniCPM5 1B base model plus the "teaching" LoRA adapter hosted on the Hub.
  minicpm5-1b-teaching-hub:
    label: MiniCPM5 1B teaching LoRA (Hub, fine-tuned)
    backend: transformers
    model_id: openbmb/MiniCPM5-1B
    # A Hub repo id rather than a filesystem path; the adapter is downloaded.
    adapter_path: MSGEncrypted/minicpm5-1b-teaching-lora
    # NOTE(review): presumably forwarded to Transformers' from_pretrained — confirm.
    trust_remote_code: true

  # MiniCPM5 1B base model plus the "math" LoRA adapter hosted on the Hub.
  minicpm5-1b-math-hub:
    label: MiniCPM5 1B math LoRA (Hub, fine-tuned)
    backend: transformers
    model_id: openbmb/MiniCPM5-1B
    # A Hub repo id rather than a filesystem path; the adapter is downloaded.
    adapter_path: MSGEncrypted/minicpm5-1b-math-lora
    # NOTE(review): presumably forwarded to Transformers' from_pretrained — confirm.
    trust_remote_code: true

  # MiniCPM5 1B base model plus the FR/AR "language lesson" LoRA adapter,
  # fetched from the Hub.
  minicpm5-1b-language-lesson-hub:
    label: MiniCPM5 1B language lesson LoRA (FR/AR, Hub)
    backend: transformers
    model_id: openbmb/MiniCPM5-1B
    # A Hub repo id rather than a filesystem path; the adapter is downloaded.
    adapter_path: MSGEncrypted/minicpm5-1b-language-lesson-lora
    # NOTE(review): presumably forwarded to Transformers' from_pretrained — confirm.
    trust_remote_code: true

  # MiniCPM5 1B base model plus the FR/AR "language lesson" LoRA adapter,
  # read from a local directory instead of the Hub.
  minicpm5-1b-language-lesson-lora:
    label: MiniCPM5 1B language lesson LoRA (FR/AR, local)
    backend: transformers
    model_id: openbmb/MiniCPM5-1B
    # Relative path — presumably resolved against the working directory (confirm).
    adapter_path: ./models/finetuned/language-lesson-lora
    # NOTE(review): presumably forwarded to Transformers' from_pretrained — confirm.
    trust_remote_code: true

  # Tiny Aya "Global" 3.3B, labelled as the multilingual coach; transformers backend.
  tiny-aya-global:
    label: Tiny Aya Global 3.3B (multilingual coach)
    backend: transformers
    model_id: CohereLabs/tiny-aya-global
    # NOTE(review): presumably forwarded to Transformers' from_pretrained;
    # confirm this repo needs it, since it permits running repo-supplied code.
    trust_remote_code: true

  # Tiny Aya "Water" 3.3B, labelled for European / Asia-Pacific languages.
  tiny-aya-water:
    label: Tiny Aya Water 3.3B (European / Asia-Pacific)
    backend: transformers
    model_id: CohereLabs/tiny-aya-water
    # NOTE(review): presumably forwarded to Transformers' from_pretrained;
    # confirm this repo needs it, since it permits running repo-supplied code.
    trust_remote_code: true

  # Tiny Aya "Fire" 3.3B, labelled for South Asian languages.
  tiny-aya-fire:
    label: Tiny Aya Fire 3.3B (South Asian)
    backend: transformers
    model_id: CohereLabs/tiny-aya-fire
    # NOTE(review): presumably forwarded to Transformers' from_pretrained;
    # confirm this repo needs it, since it permits running repo-supplied code.
    trust_remote_code: true

  # Tiny Aya "Earth" 3.3B, labelled for West Asian / African languages.
  tiny-aya-earth:
    label: Tiny Aya Earth 3.3B (West Asian / African)
    backend: transformers
    model_id: CohereLabs/tiny-aya-earth
    # NOTE(review): presumably forwarded to Transformers' from_pretrained;
    # confirm this repo needs it, since it permits running repo-supplied code.
    trust_remote_code: true