pere committed on
Commit
1b9bea6
·
1 Parent(s): 262ed92
Files changed (5) hide show
  1. .config.json.swn +0 -0
  2. .config.json.swo +0 -0
  3. .config.json.swp +0 -0
  4. config.json +1 -1
  5. run_step1.sh +1 -0
.config.json.swn ADDED
File without changes
.config.json.swo ADDED
File without changes
.config.json.swp ADDED
File without changes
config.json CHANGED
@@ -20,7 +20,7 @@
20
  "num_hidden_layers": 12,
21
  "pad_token_id": 1,
22
  "position_embedding_type": "absolute",
23
- "torch_dtype": "float32",
24
  "transformers_version": "4.14.0.dev0",
25
  "type_vocab_size": 1,
26
  "use_cache": true,
 
20
  "num_hidden_layers": 12,
21
  "pad_token_id": 1,
22
  "position_embedding_type": "absolute",
23
+ "torch_dtype": "bfloat16",
24
  "transformers_version": "4.14.0.dev0",
25
  "type_vocab_size": 1,
26
  "use_cache": true,
run_step1.sh CHANGED
@@ -21,5 +21,6 @@
21
  --preprocessing_num_workers="64" \
22
  --auth_token="True" \
23
  --static_learning_rate="True" \
 
24
  --adafactor \
25
  --push_to_hub
 
21
  --preprocessing_num_workers="64" \
22
  --auth_token="True" \
23
  --static_learning_rate="True" \
24
+ --dtype="bfloat16" \
25
  --adafactor \
26
  --push_to_hub