mazesmazes committed on
Commit
cd9f829
·
verified ·
1 Parent(s): 0adf7b4

Training in progress, step 16000

Browse files
Files changed (2) hide show
  1. config.json +5 -5
  2. model.safetensors +1 -1
config.json CHANGED
@@ -119,7 +119,7 @@
119
  "type": "audio"
120
  }
121
  },
122
- "do_sample": false,
123
  "downsample_rate": 5,
124
  "dtype": "bfloat16",
125
  "enable_thinking": true,
@@ -252,7 +252,7 @@
252
  "up_proj",
253
  "down_proj"
254
  ],
255
- "max_new_tokens": 1024,
256
  "min_new_tokens": 0,
257
  "model_dtype": "bfloat16",
258
  "model_type": "asr_model",
@@ -275,10 +275,10 @@
275
  "qformer_num_heads": 16,
276
  "qformer_num_layers": 2,
277
  "qformer_window_size": 15,
278
- "repetition_penalty": 1.0,
279
  "router_aux_loss_coef": 0.01,
280
  "system_prompt": "",
281
- "temperature": 0.8,
282
  "text_config": {
283
  "_name_or_path": "HuggingFaceTB/SmolLM3-3B",
284
  "architectures": [
@@ -399,4 +399,4 @@
399
  "use_lora": false,
400
  "use_specaugment": true,
401
  "vocab_size": 128257
402
- }
 
119
  "type": "audio"
120
  }
121
  },
122
+ "do_sample": true,
123
  "downsample_rate": 5,
124
  "dtype": "bfloat16",
125
  "enable_thinking": true,
 
252
  "up_proj",
253
  "down_proj"
254
  ],
255
+ "max_new_tokens": 128,
256
  "min_new_tokens": 0,
257
  "model_dtype": "bfloat16",
258
  "model_type": "asr_model",
 
275
  "qformer_num_heads": 16,
276
  "qformer_num_layers": 2,
277
  "qformer_window_size": 15,
278
+ "repetition_penalty": 1.1,
279
  "router_aux_loss_coef": 0.01,
280
  "system_prompt": "",
281
+ "temperature": 1.0,
282
  "text_config": {
283
  "_name_or_path": "HuggingFaceTB/SmolLM3-3B",
284
  "architectures": [
 
399
  "use_lora": false,
400
  "use_specaugment": true,
401
  "vocab_size": 128257
402
+ }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e8f40cce2270ed5e01a0055f559d9010d5043000a3c056b90acd1af8b96ba92
3
  size 14682440
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ac436124a77178225ce77ad718d45ef2560fdbd6090403fdc4a19794e0faa7b
3
  size 14682440