updated
Browse files
- .config.json.swn +0 -0
- .config.json.swo +0 -0
- .config.json.swp +0 -0
- config.json +1 -1
- run_step1.sh +1 -0
.config.json.swn
ADDED
|
File without changes
|
.config.json.swo
ADDED
|
File without changes
|
.config.json.swp
ADDED
|
File without changes
|
config.json
CHANGED
|
@@ -20,7 +20,7 @@
|
|
| 20 |
"num_hidden_layers": 12,
|
| 21 |
"pad_token_id": 1,
|
| 22 |
"position_embedding_type": "absolute",
|
| 23 |
-
"torch_dtype": "
|
| 24 |
"transformers_version": "4.14.0.dev0",
|
| 25 |
"type_vocab_size": 1,
|
| 26 |
"use_cache": true,
|
|
|
|
| 20 |
"num_hidden_layers": 12,
|
| 21 |
"pad_token_id": 1,
|
| 22 |
"position_embedding_type": "absolute",
|
| 23 |
+
"torch_dtype": "bfloat16",
|
| 24 |
"transformers_version": "4.14.0.dev0",
|
| 25 |
"type_vocab_size": 1,
|
| 26 |
"use_cache": true,
|
run_step1.sh
CHANGED
|
@@ -21,5 +21,6 @@
|
|
| 21 |
--preprocessing_num_workers="64" \
|
| 22 |
--auth_token="True" \
|
| 23 |
--static_learning_rate="True" \
|
|
|
|
| 24 |
--adafactor \
|
| 25 |
--push_to_hub
|
|
|
|
| 21 |
--preprocessing_num_workers="64" \
|
| 22 |
--auth_token="True" \
|
| 23 |
--static_learning_rate="True" \
|
| 24 |
+
--dtype="bfloat16" \
|
| 25 |
--adafactor \
|
| 26 |
--push_to_hub
|