Upload QLoRA model checkpoint
Browse files- .gitattributes +4 -0
- config.json +27 -0
- merges.txt +0 -0
- model/_CHECKPOINT_METADATA +1 -0
- model/_METADATA +0 -0
- model/_sharding +1 -0
- model/array_metadatas/process_0 +1 -0
- model/d/6c59d3c732fc4394586c213aca6515ae +0 -0
- model/manifest.ocdbt +0 -0
- model/ocdbt.process_0/d/4031c75894acb210608df91bd1a6ae73 +3 -0
- model/ocdbt.process_0/d/5c83ac2b5d01d9393aa67efee0d7ee5c +0 -0
- model/ocdbt.process_0/d/a6d725c1c9b94477df4e79223f9cffd5 +0 -0
- model/ocdbt.process_0/d/afee9522c684dba13719890caae7e6ae +3 -0
- model/ocdbt.process_0/d/dd4142f6221e2dbaeb499a7791f74d28 +3 -0
- model/ocdbt.process_0/d/fe9862bb771a1eb57def534a83e8e566 +3 -0
- model/ocdbt.process_0/manifest.ocdbt +0 -0
- qlora_config.json +6 -0
- special_tokens_map.json +6 -0
- tokenizer.json +0 -0
- tokenizer_config.json +21 -0
- vocab.json +0 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
model/ocdbt.process_0/d/4031c75894acb210608df91bd1a6ae73 filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
model/ocdbt.process_0/d/afee9522c684dba13719890caae7e6ae filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
model/ocdbt.process_0/d/dd4142f6221e2dbaeb499a7791f74d28 filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
model/ocdbt.process_0/d/fe9862bb771a1eb57def534a83e8e566 filter=lfs diff=lfs merge=lfs -text
|
config.json
ADDED
|
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"activation_function": "gelu_new",
|
| 3 |
+
"attn_pdrop": 0.1,
|
| 4 |
+
"bos_token_id": 50256,
|
| 5 |
+
"embd_pdrop": 0.1,
|
| 6 |
+
"eos_token_id": 50256,
|
| 7 |
+
"initializer_range": 0.02,
|
| 8 |
+
"layer_norm_epsilon": 1e-05,
|
| 9 |
+
"model_type": "gpt2",
|
| 10 |
+
"n_embd": 768,
|
| 11 |
+
"n_head": 12,
|
| 12 |
+
"n_inner": null,
|
| 13 |
+
"n_layer": 12,
|
| 14 |
+
"n_positions": 512,
|
| 15 |
+
"reorder_and_upcast_attn": false,
|
| 16 |
+
"resid_pdrop": 0.1,
|
| 17 |
+
"scale_attn_by_inverse_layer_idx": false,
|
| 18 |
+
"scale_attn_weights": true,
|
| 19 |
+
"summary_activation": null,
|
| 20 |
+
"summary_first_dropout": 0.1,
|
| 21 |
+
"summary_proj_to_labels": true,
|
| 22 |
+
"summary_type": "cls_index",
|
| 23 |
+
"summary_use_proj": true,
|
| 24 |
+
"transformers_version": "4.57.1",
|
| 25 |
+
"use_cache": true,
|
| 26 |
+
"vocab_size": 50257
|
| 27 |
+
}
|
merges.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
model/_CHECKPOINT_METADATA
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"item_handlers": "orbax.checkpoint._src.handlers.pytree_checkpoint_handler.PyTreeCheckpointHandler", "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1763990492527325362, "commit_timestamp_nsecs": 1763990494760634787, "custom_metadata": {}}
|
model/_METADATA
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
model/_sharding
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"YmxvY2tzLjAuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLm5vcm0xLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLm5vcm0xLnNjYWxlLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLm5vcm0yLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLm5vcm0yLnNjYWxlLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ua19wcm9qLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ua19wcm9qLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ua19wcm9qLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ua19wcm9qLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ub19wcm9qLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ub19wcm9qLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ub19wcm9qLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ub19wcm9qLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ucV9wcm9qLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ucV9wcm9qLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ucV9wcm9qLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ucV9wcm9qLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4udl9wcm9qLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4udl9wcm9qLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4udl9wcm9qLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4udl9wcm9qLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmZmbl91cC5saW5lYXIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmZmbl91cC5saW5lYXIua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmZmbl91cC5sb3JhX0Eua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmZmbl91cC5sb3JhX0Iua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmZmbl9kb3duLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmZmbl9kb3duLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLm5vcm0xLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLm5vcm0xLnNjYWxlLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLm5vcm0yLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLm5vcm0yLnNjYWxlLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ua19wcm9qLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ua19wcm9qLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ua19wcm9qLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ua19wcm9qLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ub19wcm9qLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ub19wcm9qLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ub19wcm9qLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ub19wcm9qLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ucV9wcm9qLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ucV9wcm9qLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ucV9wcm9qLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ucV9wcm9qLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4udl9wcm9qLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4udl9wcm9qLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4udl9wcm9qLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4udl9wcm9qLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmZmbl91cC5saW5lYXIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmZmbl91cC5saW5lYXIua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmZmbl91cC5sb3JhX0Eua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmZmbl91cC5sb3JhX0Iua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmZmbl9kb3duLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmZmbl9kb3duLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjgubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjgubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjgubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjgubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","bG1faGVhZC5saW5lYXIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","bG1faGVhZC5saW5lYXIua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","bG1faGVhZC5sb3JhX0Eua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","bG1faGVhZC5sb3JhX0Iua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","bm9ybS5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","bm9ybS5zY2FsZS52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cG9zX2VtYmVkLmVtYmVkZGluZy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","dG9rZW5fZW1iZWQuZW1iZWRkaW5nLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}"}
|
model/array_metadatas/process_0
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "blocks.0.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "lm_head.linear.bias.value", "write_shape": [50257], "chunk_shape": [50257], "ext_metadata": null}}, {"array_metadata": {"param_name": "lm_head.linear.kernel.value", "write_shape": [768, 50257], "chunk_shape": [768, 50257], "ext_metadata": null}}, {"array_metadata": {"param_name": "lm_head.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "lm_head.lora_B.kernel.value", "write_shape": [8, 50257], "chunk_shape": [8, 50257], "ext_metadata": null}}, {"array_metadata": {"param_name": "norm.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "norm.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "pos_embed.embedding.value", "write_shape": [512, 768], "chunk_shape": [512, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "token_embed.embedding.value", "write_shape": [50257, 768], "chunk_shape": [50257, 768], "ext_metadata": null}}]}
|
model/d/6c59d3c732fc4394586c213aca6515ae
ADDED
|
Binary file (3.42 kB). View file
|
|
|
model/manifest.ocdbt
ADDED
|
Binary file (118 Bytes). View file
|
|
|
model/ocdbt.process_0/d/4031c75894acb210608df91bd1a6ae73
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9bf6feed1ae10ab5af6cf0ab55b6a57f6e5901db0f981a3acd38f002b9479ca5
|
| 3 |
+
size 8712192
|
model/ocdbt.process_0/d/5c83ac2b5d01d9393aa67efee0d7ee5c
ADDED
|
Binary file (248 Bytes). View file
|
|
|
model/ocdbt.process_0/d/a6d725c1c9b94477df4e79223f9cffd5
ADDED
|
Binary file (552 Bytes). View file
|
|
|
model/ocdbt.process_0/d/afee9522c684dba13719890caae7e6ae
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ef677ab785fbfa504abde919213bbda93c7fe2036e4ea1b781b6a22e01c8c02
|
| 3 |
+
size 157904896
|
model/ocdbt.process_0/d/dd4142f6221e2dbaeb499a7791f74d28
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ef4b9af9bd2888d863fca46ca83a5f856d493e47fba13a8a7a9ca415c8c42403
|
| 3 |
+
size 933122
|
model/ocdbt.process_0/d/fe9862bb771a1eb57def534a83e8e566
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:194607996414f2d3baf05f219c498a4af6bca7f52af3ba6d298b36366c13c26c
|
| 3 |
+
size 173555712
|
model/ocdbt.process_0/manifest.ocdbt
ADDED
|
Binary file (365 Bytes). View file
|
|
|
qlora_config.json
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"lora_rank": 8,
|
| 3 |
+
"lora_alpha": 16,
|
| 4 |
+
"lora_dropout": 0.05,
|
| 5 |
+
"quant_bits": 4
|
| 6 |
+
}
|
special_tokens_map.json
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token": "<|endoftext|>",
|
| 3 |
+
"eos_token": "<|endoftext|>",
|
| 4 |
+
"pad_token": "<|endoftext|>",
|
| 5 |
+
"unk_token": "<|endoftext|>"
|
| 6 |
+
}
|
tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_prefix_space": false,
|
| 3 |
+
"added_tokens_decoder": {
|
| 4 |
+
"50256": {
|
| 5 |
+
"content": "<|endoftext|>",
|
| 6 |
+
"lstrip": false,
|
| 7 |
+
"normalized": true,
|
| 8 |
+
"rstrip": false,
|
| 9 |
+
"single_word": false,
|
| 10 |
+
"special": true
|
| 11 |
+
}
|
| 12 |
+
},
|
| 13 |
+
"bos_token": "<|endoftext|>",
|
| 14 |
+
"clean_up_tokenization_spaces": false,
|
| 15 |
+
"eos_token": "<|endoftext|>",
|
| 16 |
+
"extra_special_tokens": {},
|
| 17 |
+
"model_max_length": 1024,
|
| 18 |
+
"pad_token": "<|endoftext|>",
|
| 19 |
+
"tokenizer_class": "GPT2Tokenizer",
|
| 20 |
+
"unk_token": "<|endoftext|>"
|
| 21 |
+
}
|
vocab.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|