mazesmazes
/

tiny-audio-lora

Automatic Speech Recognition

speech-recognition

Model card Files Files and versions

mazesmazes committed on Jan 8

Commit

21db0a1

·

verified ·

1 Parent(s): 150530c

Training in progress - step 500

Files changed (1) hide show

asr_modeling.py +3 -1

asr_modeling.py CHANGED Viewed

@@ -827,8 +827,10 @@ class ASRModel(PreTrainedModel, GenerationMixin):
         self.feature_extractor.save_pretrained(save_dir)
         # Save LoRA adapters if present (creates adapter_model.safetensors and adapter_config.json)
         if hasattr(self.language_model, "peft_config"):
-            self.language_model.save_pretrained(save_dir)
         # Add processor auto_map to preprocessor_config.json
         config_path = save_dir / "preprocessor_config.json"

         self.feature_extractor.save_pretrained(save_dir)
         # Save LoRA adapters if present (creates adapter_model.safetensors and adapter_config.json)
+        # Don't save embedding layers - the <audio> token embedding is never used
+        # (it's replaced with projected audio embeddings before the LLM sees it)
         if hasattr(self.language_model, "peft_config"):
+            self.language_model.save_pretrained(save_dir, save_embedding_layers=False)
         # Add processor auto_map to preprocessor_config.json
         config_path = save_dir / "preprocessor_config.json"