Training in progress - step 50
Browse files
- asr_modeling.py +2 -2
asr_modeling.py
CHANGED
|
@@ -85,7 +85,7 @@ class ASRModel(PreTrainedModel, GenerationMixin):
|
|
| 85 |
from peft import PeftModel
|
| 86 |
|
| 87 |
# Get adapter directory (parent of adapter_config.json)
|
| 88 |
-
adapter_path = Path(adapter_config).parent
|
| 89 |
model.language_model = PeftModel.from_pretrained(
|
| 90 |
model.language_model, adapter_path, is_trainable=False
|
| 91 |
)
|
|
@@ -186,7 +186,7 @@ class ASRModel(PreTrainedModel, GenerationMixin):
|
|
| 186 |
decoder_kwargs = {
|
| 187 |
"attn_implementation": config.attn_implementation,
|
| 188 |
"trust_remote_code": True,
|
| 189 |
-
"tie_word_embeddings":
|
| 190 |
"low_cpu_mem_usage": True,
|
| 191 |
"dtype": dtype,
|
| 192 |
}
|
|
|
|
| 85 |
from peft import PeftModel
|
| 86 |
|
| 87 |
# Get adapter directory (parent of adapter_config.json)
|
| 88 |
+
adapter_path = str(Path(adapter_config).parent)
|
| 89 |
model.language_model = PeftModel.from_pretrained(
|
| 90 |
model.language_model, adapter_path, is_trainable=False
|
| 91 |
)
|
|
|
|
| 186 |
decoder_kwargs = {
|
| 187 |
"attn_implementation": config.attn_implementation,
|
| 188 |
"trust_remote_code": True,
|
| 189 |
+
"tie_word_embeddings": False,
|
| 190 |
"low_cpu_mem_usage": True,
|
| 191 |
"dtype": dtype,
|
| 192 |
}
|