mazesmazes committed on
Commit
2d9a946
·
verified ·
1 Parent(s): 3ad8d10

Training in progress, step 2000

Browse files
Files changed (3) hide show
  1. config.json +4 -1
  2. model.safetensors +1 -1
  3. training_args.bin +1 -1
config.json CHANGED
@@ -2,7 +2,7 @@
2
  "architectures": [
3
  "ASRModel"
4
  ],
5
- "attn_implementation": "sdpa",
6
  "audio_config": {
7
  "_name_or_path": "zai-org/GLM-ASR-Nano-2512",
8
  "architectures": [
@@ -237,6 +237,8 @@
237
  "eos_token_id": 151645,
238
  "freeze_language_model": false,
239
  "freeze_projector": false,
 
 
240
  "length_penalty": 1.0,
241
  "llm_dim": 1024,
242
  "lora_alpha": 32,
@@ -262,6 +264,7 @@
262
  "pad_token_id": 151643,
263
  "pipeline_tag": "automatic-speech-recognition",
264
  "pretrained_model_path": "mazesmazes/tiny-audio-next-multiasr",
 
265
  "projector_hidden_dim": 1024,
266
  "projector_pool_stride": 4,
267
  "projector_type": "mlp",
 
2
  "architectures": [
3
  "ASRModel"
4
  ],
5
+ "attn_implementation": "flash_attention_2",
6
  "audio_config": {
7
  "_name_or_path": "zai-org/GLM-ASR-Nano-2512",
8
  "architectures": [
 
237
  "eos_token_id": 151645,
238
  "freeze_language_model": false,
239
  "freeze_projector": false,
240
+ "freeze_text_embed_tokens": false,
241
+ "label_smoothing": 0.1,
242
  "length_penalty": 1.0,
243
  "llm_dim": 1024,
244
  "lora_alpha": 32,
 
264
  "pad_token_id": 151643,
265
  "pipeline_tag": "automatic-speech-recognition",
266
  "pretrained_model_path": "mazesmazes/tiny-audio-next-multiasr",
267
+ "projector_dropout": 0.1,
268
  "projector_hidden_dim": 1024,
269
  "projector_pool_stride": 4,
270
  "projector_type": "mlp",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e3f1e1c7f213cd13966c1a0d965d94c0ce44eabf2d8e58431b80e3730a30a27
3
  size 2408324496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a68edaf462dc0dff106ee98009731f2fe32fa8e7ff830db243c3843f3f04d55
3
  size 2408324496
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a7d229c5297761b25301e2a4804bd1c7a398f226ee380926cfefa3f38af5ff8
3
  size 5393
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93249932015f989823ad2ba998cfe00b3cf2b93f3e7532c45177ee0fb8635ad2
3
  size 5393