mazesmazes
/

tiny-audio-next-multiasr

Automatic Speech Recognition

feature-extraction

speech-recognition

Model card · Files and versions

mazesmazes committed 14 days ago

Commit

2d9a946

·

verified ·

1 Parent(s): 3ad8d10

Training in progress, step 2000

Files changed (3) hide show

config.json +4 -1
model.safetensors +1 -1
training_args.bin +1 -1

config.json CHANGED Viewed

@@ -2,7 +2,7 @@
   "architectures": [
     "ASRModel"
   ],
-  "attn_implementation": "sdpa",
   "audio_config": {
     "_name_or_path": "zai-org/GLM-ASR-Nano-2512",
     "architectures": [
@@ -237,6 +237,8 @@
   "eos_token_id": 151645,
   "freeze_language_model": false,
   "freeze_projector": false,
   "length_penalty": 1.0,
   "llm_dim": 1024,
   "lora_alpha": 32,
@@ -262,6 +264,7 @@
   "pad_token_id": 151643,
   "pipeline_tag": "automatic-speech-recognition",
   "pretrained_model_path": "mazesmazes/tiny-audio-next-multiasr",
   "projector_hidden_dim": 1024,
   "projector_pool_stride": 4,
   "projector_type": "mlp",

   "architectures": [
     "ASRModel"
   ],
+  "attn_implementation": "flash_attention_2",
   "audio_config": {
     "_name_or_path": "zai-org/GLM-ASR-Nano-2512",
     "architectures": [
   "eos_token_id": 151645,
   "freeze_language_model": false,
   "freeze_projector": false,
+  "freeze_text_embed_tokens": false,
+  "label_smoothing": 0.1,
   "length_penalty": 1.0,
   "llm_dim": 1024,
   "lora_alpha": 32,
   "pad_token_id": 151643,
   "pipeline_tag": "automatic-speech-recognition",
   "pretrained_model_path": "mazesmazes/tiny-audio-next-multiasr",
+  "projector_dropout": 0.1,
   "projector_hidden_dim": 1024,
   "projector_pool_stride": 4,
   "projector_type": "mlp",

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3e3f1e1c7f213cd13966c1a0d965d94c0ce44eabf2d8e58431b80e3730a30a27
 size 2408324496

 version https://git-lfs.github.com/spec/v1
+oid sha256:6a68edaf462dc0dff106ee98009731f2fe32fa8e7ff830db243c3843f3f04d55
 size 2408324496

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6a7d229c5297761b25301e2a4804bd1c7a398f226ee380926cfefa3f38af5ff8
 size 5393

 version https://git-lfs.github.com/spec/v1
+oid sha256:93249932015f989823ad2ba998cfe00b3cf2b93f3e7532c45177ee0fb8635ad2
 size 5393