Training in progress, step 1000

Files changed (5) hide show

adapter_config.json CHANGED Viewed

@@ -3,7 +3,7 @@
   "alpha_pattern": {},
   "arrow_config": null,
   "auto_mapping": null,
-  "base_model_name_or_path": "checkpoint-18000",
   "bias": "none",
   "corda_config": null,
   "ensure_weight_tying": false,
@@ -29,8 +29,8 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "v_proj",
-    "q_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",

   "alpha_pattern": {},
   "arrow_config": null,
   "auto_mapping": null,
+  "base_model_name_or_path": "mazesmazes/tiny-audio",
   "bias": "none",
   "corda_config": null,
   "ensure_weight_tying": false,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "q_proj",
+    "v_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8041780442726f6dfe4977f7481dc095fc6641f80f8efd6b511ce6698c79c44c
 size 36715216

 version https://git-lfs.github.com/spec/v1
+oid sha256:b3d9525bb79a88033e2abf0745be479d053bc7e472082abe550fc21970f0171f
 size 36715216

config.json CHANGED Viewed

@@ -277,6 +277,7 @@
   ],
   "encoder_dim": 1280,
   "freeze_projector": false,
   "inference_warmup_tokens": 10,
   "label_smoothing": 0.0,
   "length_penalty": 1.0,
@@ -288,12 +289,6 @@
     "q_proj",
     "v_proj"
   ],
-  "mask_feature_length": 10,
-  "mask_feature_min_masks": 2,
-  "mask_feature_prob": 0.05,
-  "mask_time_length": 15,
-  "mask_time_min_masks": 2,
-  "mask_time_prob": 0.1,
   "max_new_tokens": 128,
   "min_new_tokens": 0,
   "model_dtype": "bfloat16",
@@ -302,6 +297,8 @@
   "num_beams": 1,
   "num_experts": 4,
   "num_experts_per_tok": 2,
   "pipeline_tag": "automatic-speech-recognition",
   "pretrained_model_path": "mazesmazes/tiny-audio",
   "projector_dropout": 0.0,
@@ -381,6 +378,7 @@
     "vocab_size": 151670
   },
   "text_model_id": "Qwen/Qwen3-0.6B",
   "transformers_version": "5.0.0.dev0",
   "use_cache": false,
   "use_lora": true,

   ],
   "encoder_dim": 1280,
   "freeze_projector": false,
+  "freq_mask_length": 10,
   "inference_warmup_tokens": 10,
   "label_smoothing": 0.0,
   "length_penalty": 1.0,
     "q_proj",
     "v_proj"
   ],
   "max_new_tokens": 128,
   "min_new_tokens": 0,
   "model_dtype": "bfloat16",
   "num_beams": 1,
   "num_experts": 4,
   "num_experts_per_tok": 2,
+  "num_freq_masks": 2,
+  "num_time_masks": 2,
   "pipeline_tag": "automatic-speech-recognition",
   "pretrained_model_path": "mazesmazes/tiny-audio",
   "projector_dropout": 0.0,
     "vocab_size": 151670
   },
   "text_model_id": "Qwen/Qwen3-0.6B",
+  "time_mask_length": 15,
   "transformers_version": "5.0.0.dev0",
   "use_cache": false,
   "use_lora": true,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1d884484522ff44b7cc38a1a0fd035e7fb7cb3d7954709726db5761e42ec88a3
 size 25172384

 version https://git-lfs.github.com/spec/v1
+oid sha256:82b3a651cbcecc1ac7e3a970b54119ae5a9c12b53c5e6f3fee991ab69340d5f3
 size 25172384

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6cb17eae71944b178ffca38182449645e5a12a962efd2d3eb01b9a84d725d5ed
 size 5201

 version https://git-lfs.github.com/spec/v1
+oid sha256:043f6ed7f53a2db67ac5f2249ac181fc40cb4bef3a20d41c2b1f48eae3176980
 size 5201