AaryanK committed on
Commit
fe74938
·
verified ·
1 Parent(s): dd94c69

Change license to MIT, consistent with the Git repository

Browse files
Files changed (1) hide show
  1. README.md +32 -32
README.md CHANGED
@@ -1,44 +1,44 @@
1
  ---
2
  language:
3
- - en
4
- license: apache-2.0
5
  library_name: llama-cpp-python
6
  base_model: katanemo/Arch-Router-1.5B
7
  tags:
8
- - routing
9
- - grpo
10
- - reinforcement-learning
11
- - gguf
12
- - lora
13
- - unsloth
14
- - trl
15
- - qwen2
16
- - llama-cpp
17
- - contract-aware
18
- - cost-optimization
19
- - query-classification
20
  model_type: qwen2
21
  pipeline_tag: text-classification
22
  datasets:
23
- - custom
24
  metrics:
25
- - accuracy
26
  model-index:
27
- - name: ModelGate-Router
28
- results:
29
- - task:
30
- type: text-classification
31
- name: Query Complexity Classification
32
- metrics:
33
- - type: accuracy
34
- value: 83.3
35
- name: Overall Accuracy (held-out, GGUF Q8_0)
36
- - type: accuracy
37
- value: 85.7
38
- name: Medium Tier Accuracy
39
- - type: latency
40
- value: 62
41
- name: Avg Latency (ms, CUDA)
42
  ---
43
 
44
  <p align="center">
@@ -257,4 +257,4 @@ scripts/
257
  bench_mmlu.py # MMLU benchmark runner
258
  mmlu_questions.json # 60 real MMLU questions from HuggingFace
259
  start.sh # One-command startup
260
- ```
 
1
  ---
2
  language:
3
+ - en
4
+ license: mit
5
  library_name: llama-cpp-python
6
  base_model: katanemo/Arch-Router-1.5B
7
  tags:
8
+ - routing
9
+ - grpo
10
+ - reinforcement-learning
11
+ - gguf
12
+ - lora
13
+ - unsloth
14
+ - trl
15
+ - qwen2
16
+ - llama-cpp
17
+ - contract-aware
18
+ - cost-optimization
19
+ - query-classification
20
  model_type: qwen2
21
  pipeline_tag: text-classification
22
  datasets:
23
+ - custom
24
  metrics:
25
+ - accuracy
26
  model-index:
27
+ - name: ModelGate-Router
28
+ results:
29
+ - task:
30
+ type: text-classification
31
+ name: Query Complexity Classification
32
+ metrics:
33
+ - type: accuracy
34
+ value: 83.3
35
+ name: Overall Accuracy (held-out, GGUF Q8_0)
36
+ - type: accuracy
37
+ value: 85.7
38
+ name: Medium Tier Accuracy
39
+ - type: latency
40
+ value: 62
41
+ name: Avg Latency (ms, CUDA)
42
  ---
43
 
44
  <p align="center">
 
257
  bench_mmlu.py # MMLU benchmark runner
258
  mmlu_questions.json # 60 real MMLU questions from HuggingFace
259
  start.sh # One-command startup
260
+ ```