Spaces:
Sleeping
Sleeping
Upload transformers_config.json with huggingface_hub
Browse files
- transformers_config.json +18 -2
transformers_config.json
CHANGED
|
@@ -82,7 +82,9 @@
|
|
| 82 |
"overlap_comm": true,
|
| 83 |
"reduce_scatter": true,
|
| 84 |
"reduce_bucket_size": 5e8,
|
| 85 |
-
"allgather_bucket_size": 5e8
|
|
|
|
|
|
|
| 86 |
},
|
| 87 |
"gradient_accumulation_steps": 4,
|
| 88 |
"gradient_clipping": 0.3,
|
|
@@ -114,6 +116,20 @@
|
|
| 114 |
"steps_per_print": 10,
|
| 115 |
"train_batch_size": "auto",
|
| 116 |
"train_micro_batch_size_per_gpu": "auto",
|
| 117 |
-
"wall_clock_breakdown": false
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 118 |
}
|
| 119 |
}
|
|
|
|
| 82 |
"overlap_comm": true,
|
| 83 |
"reduce_scatter": true,
|
| 84 |
"reduce_bucket_size": 5e8,
|
| 85 |
+
"allgather_bucket_size": 5e8,
|
| 86 |
+
"allgather_partitions": true,
|
| 87 |
+
"allgather_no_copy": true
|
| 88 |
},
|
| 89 |
"gradient_accumulation_steps": 4,
|
| 90 |
"gradient_clipping": 0.3,
|
|
|
|
| 116 |
"steps_per_print": 10,
|
| 117 |
"train_batch_size": "auto",
|
| 118 |
"train_micro_batch_size_per_gpu": "auto",
|
| 119 |
+
"wall_clock_breakdown": false,
|
| 120 |
+
"communication_data_type": "fp16",
|
| 121 |
+
"comms_logger": {
|
| 122 |
+
"enabled": false
|
| 123 |
+
},
|
| 124 |
+
"amp": {
|
| 125 |
+
"enabled": false
|
| 126 |
+
},
|
| 127 |
+
"aio": {
|
| 128 |
+
"block_size": 1048576,
|
| 129 |
+
"queue_depth": 8,
|
| 130 |
+
"thread_count": 1,
|
| 131 |
+
"single_submit": false,
|
| 132 |
+
"overlap_events": true
|
| 133 |
+
}
|
| 134 |
}
|
| 135 |
}
|