Fix alternating roles and use dtype instead of torch_dtype
Browse files
train.py
CHANGED
|
@@ -84,7 +84,7 @@ if tokenizer.pad_token is None:
|
|
| 84 |
print("Loading model...")
|
| 85 |
model = AutoModelForCausalLM.from_pretrained(
|
| 86 |
MODEL_ID,
|
| 87 |
-
torch_dtype=torch.bfloat16,
|
| 88 |
device_map="auto",
|
| 89 |
)
|
| 90 |
|
|
|
|
| 84 |
print("Loading model...")
|
| 85 |
model = AutoModelForCausalLM.from_pretrained(
|
| 86 |
MODEL_ID,
|
| 87 |
+
dtype=torch.bfloat16,
|
| 88 |
device_map="auto",
|
| 89 |
)
|
| 90 |
|