Training in progress, step 16000
Browse files
- config.json +5 -5
- model.safetensors +1 -1
config.json
CHANGED
|
@@ -119,7 +119,7 @@
|
|
| 119 |
"type": "audio"
|
| 120 |
}
|
| 121 |
},
|
| 122 |
-
"do_sample":
|
| 123 |
"downsample_rate": 5,
|
| 124 |
"dtype": "bfloat16",
|
| 125 |
"enable_thinking": true,
|
|
@@ -252,7 +252,7 @@
|
|
| 252 |
"up_proj",
|
| 253 |
"down_proj"
|
| 254 |
],
|
| 255 |
-
"max_new_tokens":
|
| 256 |
"min_new_tokens": 0,
|
| 257 |
"model_dtype": "bfloat16",
|
| 258 |
"model_type": "asr_model",
|
|
@@ -275,10 +275,10 @@
|
|
| 275 |
"qformer_num_heads": 16,
|
| 276 |
"qformer_num_layers": 2,
|
| 277 |
"qformer_window_size": 15,
|
| 278 |
-
"repetition_penalty": 1.
|
| 279 |
"router_aux_loss_coef": 0.01,
|
| 280 |
"system_prompt": "",
|
| 281 |
-
"temperature": 0
|
| 282 |
"text_config": {
|
| 283 |
"_name_or_path": "HuggingFaceTB/SmolLM3-3B",
|
| 284 |
"architectures": [
|
|
@@ -399,4 +399,4 @@
|
|
| 399 |
"use_lora": false,
|
| 400 |
"use_specaugment": true,
|
| 401 |
"vocab_size": 128257
|
| 402 |
-
}
|
|
|
|
| 119 |
"type": "audio"
|
| 120 |
}
|
| 121 |
},
|
| 122 |
+
"do_sample": true,
|
| 123 |
"downsample_rate": 5,
|
| 124 |
"dtype": "bfloat16",
|
| 125 |
"enable_thinking": true,
|
|
|
|
| 252 |
"up_proj",
|
| 253 |
"down_proj"
|
| 254 |
],
|
| 255 |
+
"max_new_tokens": 128,
|
| 256 |
"min_new_tokens": 0,
|
| 257 |
"model_dtype": "bfloat16",
|
| 258 |
"model_type": "asr_model",
|
|
|
|
| 275 |
"qformer_num_heads": 16,
|
| 276 |
"qformer_num_layers": 2,
|
| 277 |
"qformer_window_size": 15,
|
| 278 |
+
"repetition_penalty": 1.1,
|
| 279 |
"router_aux_loss_coef": 0.01,
|
| 280 |
"system_prompt": "",
|
| 281 |
+
"temperature": 1.0,
|
| 282 |
"text_config": {
|
| 283 |
"_name_or_path": "HuggingFaceTB/SmolLM3-3B",
|
| 284 |
"architectures": [
|
|
|
|
| 399 |
"use_lora": false,
|
| 400 |
"use_specaugment": true,
|
| 401 |
"vocab_size": 128257
|
| 402 |
+
}
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14682440
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8ac436124a77178225ce77ad718d45ef2560fdbd6090403fdc4a19794e0faa7b
|
| 3 |
size 14682440
|