Spaces:
Running
Running
Reorder models by total parameter count (smallest to largest)
Browse files
Correct order:
100M → 270M → 300M → 350M → 350M → 500M → 500M → 600M → 1.5B → 1.7B → 2.6B → 4B → 7B
Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>
app.py
CHANGED
|
@@ -30,19 +30,6 @@ MAX_USABLE_CTX = 32768
|
|
| 30 |
|
| 31 |
# Available models registry - ordered by parameter count (smallest to largest)
|
| 32 |
AVAILABLE_MODELS = {
|
| 33 |
-
"granite4_tiny_q3": {
|
| 34 |
-
"name": "Granite 4.0 Tiny 7B (128K Context)",
|
| 35 |
-
"repo_id": "unsloth/granite-4.0-h-tiny-GGUF",
|
| 36 |
-
"filename": "*Q3_K_M.gguf",
|
| 37 |
-
"max_context": 131072,
|
| 38 |
-
"supports_toggle": False,
|
| 39 |
-
"inference_settings": {
|
| 40 |
-
"temperature": 0.0,
|
| 41 |
-
"top_p": 1.0,
|
| 42 |
-
"top_k": 0,
|
| 43 |
-
"repeat_penalty": 1.1,
|
| 44 |
-
},
|
| 45 |
-
},
|
| 46 |
"falcon_h1_100m": {
|
| 47 |
"name": "Falcon-H1 100M",
|
| 48 |
"repo_id": "mradermacher/Falcon-H1-Tiny-Multilingual-100M-Instruct-GGUF",
|
|
@@ -152,19 +139,6 @@ AVAILABLE_MODELS = {
|
|
| 152 |
"repeat_penalty": 1.05,
|
| 153 |
},
|
| 154 |
},
|
| 155 |
-
"lfm2_2_6b_transcript": {
|
| 156 |
-
"name": "LFM2 2.6B Transcript",
|
| 157 |
-
"repo_id": "mradermacher/LFM2-2.6B-Transcript-GGUF",
|
| 158 |
-
"filename": "*Q4_K_M.gguf",
|
| 159 |
-
"max_context": 32768,
|
| 160 |
-
"supports_toggle": False,
|
| 161 |
-
"inference_settings": {
|
| 162 |
-
"temperature": 0.3,
|
| 163 |
-
"top_p": 0.9,
|
| 164 |
-
"top_k": 40,
|
| 165 |
-
"repeat_penalty": 1.1,
|
| 166 |
-
},
|
| 167 |
-
},
|
| 168 |
"qwen3_1.7b_q4": {
|
| 169 |
"name": "Qwen3 1.7B Q4",
|
| 170 |
"repo_id": "unsloth/Qwen3-1.7B-GGUF",
|
|
@@ -178,6 +152,19 @@ AVAILABLE_MODELS = {
|
|
| 178 |
"repeat_penalty": 1.05,
|
| 179 |
},
|
| 180 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 181 |
"qwen3_4b_thinking_q3": {
|
| 182 |
"name": "Qwen3 4B Thinking (256K Context)",
|
| 183 |
"repo_id": "unsloth/Qwen3-4B-Thinking-2507-GGUF",
|
|
@@ -191,6 +178,19 @@ AVAILABLE_MODELS = {
|
|
| 191 |
"repeat_penalty": 1.0,
|
| 192 |
},
|
| 193 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 194 |
}
|
| 195 |
|
| 196 |
DEFAULT_MODEL_KEY = "qwen3_600m_q4"
|
|
|
|
| 30 |
|
| 31 |
# Available models registry - ordered by parameter count (smallest to largest)
|
| 32 |
AVAILABLE_MODELS = {
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
"falcon_h1_100m": {
|
| 34 |
"name": "Falcon-H1 100M",
|
| 35 |
"repo_id": "mradermacher/Falcon-H1-Tiny-Multilingual-100M-Instruct-GGUF",
|
|
|
|
| 139 |
"repeat_penalty": 1.05,
|
| 140 |
},
|
| 141 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 142 |
"qwen3_1.7b_q4": {
|
| 143 |
"name": "Qwen3 1.7B Q4",
|
| 144 |
"repo_id": "unsloth/Qwen3-1.7B-GGUF",
|
|
|
|
| 152 |
"repeat_penalty": 1.05,
|
| 153 |
},
|
| 154 |
},
|
| 155 |
+
"lfm2_2_6b_transcript": {
|
| 156 |
+
"name": "LFM2 2.6B Transcript",
|
| 157 |
+
"repo_id": "mradermacher/LFM2-2.6B-Transcript-GGUF",
|
| 158 |
+
"filename": "*Q4_K_M.gguf",
|
| 159 |
+
"max_context": 32768,
|
| 160 |
+
"supports_toggle": False,
|
| 161 |
+
"inference_settings": {
|
| 162 |
+
"temperature": 0.3,
|
| 163 |
+
"top_p": 0.9,
|
| 164 |
+
"top_k": 40,
|
| 165 |
+
"repeat_penalty": 1.1,
|
| 166 |
+
},
|
| 167 |
+
},
|
| 168 |
"qwen3_4b_thinking_q3": {
|
| 169 |
"name": "Qwen3 4B Thinking (256K Context)",
|
| 170 |
"repo_id": "unsloth/Qwen3-4B-Thinking-2507-GGUF",
|
|
|
|
| 178 |
"repeat_penalty": 1.0,
|
| 179 |
},
|
| 180 |
},
|
| 181 |
+
"granite4_tiny_q3": {
|
| 182 |
+
"name": "Granite 4.0 Tiny 7B (128K Context)",
|
| 183 |
+
"repo_id": "unsloth/granite-4.0-h-tiny-GGUF",
|
| 184 |
+
"filename": "*Q3_K_M.gguf",
|
| 185 |
+
"max_context": 131072,
|
| 186 |
+
"supports_toggle": False,
|
| 187 |
+
"inference_settings": {
|
| 188 |
+
"temperature": 0.0,
|
| 189 |
+
"top_p": 1.0,
|
| 190 |
+
"top_k": 0,
|
| 191 |
+
"repeat_penalty": 1.1,
|
| 192 |
+
},
|
| 193 |
+
},
|
| 194 |
}
|
| 195 |
|
| 196 |
DEFAULT_MODEL_KEY = "qwen3_600m_q4"
|