Spaces:
Sleeping
Sleeping
Update train_model.py
Browse files
- train_model.py +2 -1
train_model.py
CHANGED
|
@@ -100,7 +100,8 @@ def initialize_model(task, model_name, vocab_size, sequence_length, hidden_size,
|
|
| 100 |
num_attention_heads=attention_heads,
|
| 101 |
intermediate_size=4 * hidden_size,
|
| 102 |
hidden_act='gelu',
|
| 103 |
-
use_cache=True
|
|
|
|
| 104 |
)
|
| 105 |
model = GPT2LMHeadModel(config)
|
| 106 |
logging.info("GPT2LMHeadModel initialized successfully.")
|
|
|
|
| 100 |
num_attention_heads=attention_heads,
|
| 101 |
intermediate_size=4 * hidden_size,
|
| 102 |
hidden_act='gelu',
|
| 103 |
+
use_cache=True,
|
| 104 |
+
truncation=False
|
| 105 |
)
|
| 106 |
model = GPT2LMHeadModel(config)
|
| 107 |
logging.info("GPT2LMHeadModel initialized successfully.")
|