Training in progress, step 19000
Browse files
- config.json +7 -7
- model.safetensors +1 -1
config.json
CHANGED
|
@@ -119,10 +119,10 @@
|
|
| 119 |
"type": "audio"
|
| 120 |
}
|
| 121 |
},
|
| 122 |
-
"do_sample":
|
| 123 |
"downsample_rate": 5,
|
| 124 |
"dtype": "bfloat16",
|
| 125 |
-
"enable_thinking":
|
| 126 |
"encoder": {
|
| 127 |
"_name_or_path": "zai-org/GLM-ASR-Nano-2512",
|
| 128 |
"architectures": [
|
|
@@ -252,7 +252,7 @@
|
|
| 252 |
"up_proj",
|
| 253 |
"down_proj"
|
| 254 |
],
|
| 255 |
-
"max_new_tokens":
|
| 256 |
"min_new_tokens": 0,
|
| 257 |
"model_dtype": "bfloat16",
|
| 258 |
"model_type": "asr_model",
|
|
@@ -278,7 +278,7 @@
|
|
| 278 |
"repetition_penalty": 1.1,
|
| 279 |
"router_aux_loss_coef": 0.01,
|
| 280 |
"system_prompt": "",
|
| 281 |
-
"temperature": 0
|
| 282 |
"text_config": {
|
| 283 |
"_name_or_path": "HuggingFaceTB/SmolLM3-3B",
|
| 284 |
"architectures": [
|
|
@@ -392,11 +392,11 @@
|
|
| 392 |
},
|
| 393 |
"text_model_id": "HuggingFaceTB/SmolLM3-3B",
|
| 394 |
"time_mask_length": 100,
|
| 395 |
-
"top_k":
|
| 396 |
-
"top_p": 0.
|
| 397 |
"transformers_version": "5.0.0",
|
| 398 |
"use_cache": false,
|
| 399 |
"use_lora": false,
|
| 400 |
"use_specaugment": true,
|
| 401 |
"vocab_size": 128257
|
| 402 |
-
}
|
|
|
|
| 119 |
"type": "audio"
|
| 120 |
}
|
| 121 |
},
|
| 122 |
+
"do_sample": true,
|
| 123 |
"downsample_rate": 5,
|
| 124 |
"dtype": "bfloat16",
|
| 125 |
+
"enable_thinking": true,
|
| 126 |
"encoder": {
|
| 127 |
"_name_or_path": "zai-org/GLM-ASR-Nano-2512",
|
| 128 |
"architectures": [
|
|
|
|
| 252 |
"up_proj",
|
| 253 |
"down_proj"
|
| 254 |
],
|
| 255 |
+
"max_new_tokens": 128,
|
| 256 |
"min_new_tokens": 0,
|
| 257 |
"model_dtype": "bfloat16",
|
| 258 |
"model_type": "asr_model",
|
|
|
|
| 278 |
"repetition_penalty": 1.1,
|
| 279 |
"router_aux_loss_coef": 0.01,
|
| 280 |
"system_prompt": "",
|
| 281 |
+
"temperature": 1.0,
|
| 282 |
"text_config": {
|
| 283 |
"_name_or_path": "HuggingFaceTB/SmolLM3-3B",
|
| 284 |
"architectures": [
|
|
|
|
| 392 |
},
|
| 393 |
"text_model_id": "HuggingFaceTB/SmolLM3-3B",
|
| 394 |
"time_mask_length": 100,
|
| 395 |
+
"top_k": 0,
|
| 396 |
+
"top_p": 0.01,
|
| 397 |
"transformers_version": "5.0.0",
|
| 398 |
"use_cache": false,
|
| 399 |
"use_lora": false,
|
| 400 |
"use_specaugment": true,
|
| 401 |
"vocab_size": 128257
|
| 402 |
+
}
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14682440
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bdc328fd173116582a1b8d9c999bb438e9b939494190e5840ae74a3974173f5c
|
| 3 |
size 14682440
|