mazesmazes committed on
Commit
4649499
·
verified ·
1 Parent(s): c2627d2

Training in progress - step 50

Browse files
Files changed (1) hide show
  1. asr_modeling.py +2 -2
asr_modeling.py CHANGED
@@ -85,7 +85,7 @@ class ASRModel(PreTrainedModel, GenerationMixin):
85
  from peft import PeftModel
86
 
87
  # Get adapter directory (parent of adapter_config.json)
88
- adapter_path = Path(adapter_config).parent
89
  model.language_model = PeftModel.from_pretrained(
90
  model.language_model, adapter_path, is_trainable=False
91
  )
@@ -186,7 +186,7 @@ class ASRModel(PreTrainedModel, GenerationMixin):
186
  decoder_kwargs = {
187
  "attn_implementation": config.attn_implementation,
188
  "trust_remote_code": True,
189
- "tie_word_embeddings": True,
190
  "low_cpu_mem_usage": True,
191
  "dtype": dtype,
192
  }
 
85
  from peft import PeftModel
86
 
87
  # Get adapter directory (parent of adapter_config.json)
88
+ adapter_path = str(Path(adapter_config).parent)
89
  model.language_model = PeftModel.from_pretrained(
90
  model.language_model, adapter_path, is_trainable=False
91
  )
 
186
  decoder_kwargs = {
187
  "attn_implementation": config.attn_implementation,
188
  "trust_remote_code": True,
189
+ "tie_word_embeddings": False,
190
  "low_cpu_mem_usage": True,
191
  "dtype": dtype,
192
  }