KRadim committed on
Commit
160fd24
·
verified ·
1 Parent(s): fde30c4

Upload QLoRA model checkpoint

Browse files
.gitattributes CHANGED
@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ model/ocdbt.process_0/d/4031c75894acb210608df91bd1a6ae73 filter=lfs diff=lfs merge=lfs -text
37
+ model/ocdbt.process_0/d/afee9522c684dba13719890caae7e6ae filter=lfs diff=lfs merge=lfs -text
38
+ model/ocdbt.process_0/d/dd4142f6221e2dbaeb499a7791f74d28 filter=lfs diff=lfs merge=lfs -text
39
+ model/ocdbt.process_0/d/fe9862bb771a1eb57def534a83e8e566 filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_function": "gelu_new",
3
+ "attn_pdrop": 0.1,
4
+ "bos_token_id": 50256,
5
+ "embd_pdrop": 0.1,
6
+ "eos_token_id": 50256,
7
+ "initializer_range": 0.02,
8
+ "layer_norm_epsilon": 1e-05,
9
+ "model_type": "gpt2",
10
+ "n_embd": 768,
11
+ "n_head": 12,
12
+ "n_inner": null,
13
+ "n_layer": 12,
14
+ "n_positions": 512,
15
+ "reorder_and_upcast_attn": false,
16
+ "resid_pdrop": 0.1,
17
+ "scale_attn_by_inverse_layer_idx": false,
18
+ "scale_attn_weights": true,
19
+ "summary_activation": null,
20
+ "summary_first_dropout": 0.1,
21
+ "summary_proj_to_labels": true,
22
+ "summary_type": "cls_index",
23
+ "summary_use_proj": true,
24
+ "transformers_version": "4.57.1",
25
+ "use_cache": true,
26
+ "vocab_size": 50257
27
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model/_CHECKPOINT_METADATA ADDED
@@ -0,0 +1 @@
 
 
1
+ {"item_handlers": "orbax.checkpoint._src.handlers.pytree_checkpoint_handler.PyTreeCheckpointHandler", "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1763990492527325362, "commit_timestamp_nsecs": 1763990494760634787, "custom_metadata": {}}
model/_METADATA ADDED
The diff for this file is too large to render. See raw diff
 
model/_sharding ADDED
@@ -0,0 +1 @@
 
 
1
+ {"YmxvY2tzLjAuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": 
\"cuda:0\"}","YmxvY2tzLjAuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjAubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", 
\"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": 
\"cuda:0\"}","YmxvY2tzLjEuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLm5vcm0xLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLm5vcm0xLnNjYWxlLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLm5vcm0yLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLm5vcm0yLnNjYWxlLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ua19wcm9qLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ua19wcm9qLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ua19wcm9qLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ua19wcm9qLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ub19wcm9qLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ub19wcm9qLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": 
\"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ub19wcm9qLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ub19wcm9qLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ucV9wcm9qLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ucV9wcm9qLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ucV9wcm9qLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4ucV9wcm9qLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4udl9wcm9qLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4udl9wcm9qLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4udl9wcm9qLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmF0dG4udl9wcm9qLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmZmbl91cC5saW5lYXIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmZmbl91cC5saW5lYXIua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmZmbl91cC5sb3JhX0Eua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmZmbl91cC5sb3JhX0Iua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjEwLmZmbl9kb3duLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": 
\"cuda:0\"}","YmxvY2tzLjEwLmZmbl9kb3duLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLm5vcm0xLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLm5vcm0xLnNjYWxlLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLm5vcm0yLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLm5vcm0yLnNjYWxlLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ua19wcm9qLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ua19wcm9qLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ua19wcm9qLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ua19wcm9qLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ub19wcm9qLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ub19wcm9qLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ub19wcm9qLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ub19wcm9qLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ucV9wcm9qLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ucV9wcm9qLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": 
\"cuda:0\"}","YmxvY2tzLjExLmF0dG4ucV9wcm9qLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4ucV9wcm9qLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4udl9wcm9qLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4udl9wcm9qLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4udl9wcm9qLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmF0dG4udl9wcm9qLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmZmbl91cC5saW5lYXIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmZmbl91cC5saW5lYXIua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmZmbl91cC5sb3JhX0Eua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmZmbl91cC5sb3JhX0Iua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmZmbl9kb3duLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjExLmZmbl9kb3duLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": 
\"cuda:0\"}","YmxvY2tzLjIuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": 
\"cuda:0\"}","YmxvY2tzLjIuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjIubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": 
\"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": 
\"cuda:0\"}","YmxvY2tzLjMubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjMubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": 
\"cuda:0\"}","YmxvY2tzLjQuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjQubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", 
\"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", 
\"device_str\": \"cuda:0\"}","YmxvY2tzLjUuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjUubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": 
\"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": 
\"cuda:0\"}","YmxvY2tzLjYubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjYubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": 
\"cuda:0\"}","YmxvY2tzLjcuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjcubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", 
\"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": 
\"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjguZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjgubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjgubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjgubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjgubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi52X3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi52X3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi52X3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi52X3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5rX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": 
\"cuda:0\"}","YmxvY2tzLjkuYXR0bi5rX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5rX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5rX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5vX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5vX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5vX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5vX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5xX3Byb2oubG9yYV9BLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5xX3Byb2oubG9yYV9CLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5xX3Byb2oubGluZWFyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuYXR0bi5xX3Byb2oubGluZWFyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuZmZuX2Rvd24uYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuZmZuX2Rvd24ua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuZmZuX3VwLmxpbmVhci5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuZmZuX3VwLmxpbmVhci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": 
\"cuda:0\"}","YmxvY2tzLjkuZmZuX3VwLmxvcmFfQS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkuZmZuX3VwLmxvcmFfQi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkubm9ybTEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkubm9ybTEuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkubm9ybTIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","YmxvY2tzLjkubm9ybTIuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","bG1faGVhZC5saW5lYXIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","bG1faGVhZC5saW5lYXIua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","bG1faGVhZC5sb3JhX0Eua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","bG1faGVhZC5sb3JhX0Iua2VybmVsLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","bm9ybS5iaWFzLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","bm9ybS5zY2FsZS52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cG9zX2VtYmVkLmVtYmVkZGluZy52YWx1ZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","dG9rZW5fZW1iZWQuZW1iZWRkaW5nLnZhbHVl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}"}
model/array_metadatas/process_0 ADDED
@@ -0,0 +1 @@
 
 
1
+ {"array_metadatas": [{"array_metadata": {"param_name": "blocks.0.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": 
{"param_name": "blocks.0.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.0.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, 
{"array_metadata": {"param_name": "blocks.1.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": 
{"param_name": "blocks.1.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.1.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, 
{"array_metadata": {"param_name": "blocks.2.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": 
"blocks.2.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.2.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": 
{"param_name": "blocks.3.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": 
"blocks.3.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.3.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": 
{"param_name": "blocks.4.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.ffn_down.kernel.value", 
"write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.4.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": 
"blocks.5.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.ffn_up.linear.bias.value", 
"write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.5.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": 
"blocks.6.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.ffn_up.linear.kernel.value", "write_shape": [768, 
3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.6.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": 
"blocks.7.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], 
"chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.7.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": 
"blocks.8.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], 
"chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.8.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": 
"blocks.9.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.norm1.bias.value", "write_shape": [768], 
"chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.9.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": 
"blocks.10.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], 
"ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.10.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.k_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.k_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.k_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.k_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.o_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.o_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.o_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.o_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.q_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.q_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.q_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": 
"blocks.11.attn.q_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.v_proj.linear.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.v_proj.linear.kernel.value", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.v_proj.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.attn.v_proj.lora_B.kernel.value", "write_shape": [8, 768], "chunk_shape": [8, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.ffn_down.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.ffn_down.kernel.value", "write_shape": [3072, 768], "chunk_shape": [3072, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.ffn_up.linear.bias.value", "write_shape": [3072], "chunk_shape": [3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.ffn_up.linear.kernel.value", "write_shape": [768, 3072], "chunk_shape": [768, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.ffn_up.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.ffn_up.lora_B.kernel.value", "write_shape": [8, 3072], "chunk_shape": [8, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.norm1.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.norm1.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.11.norm2.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": 
null}}, {"array_metadata": {"param_name": "blocks.11.norm2.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "lm_head.linear.bias.value", "write_shape": [50257], "chunk_shape": [50257], "ext_metadata": null}}, {"array_metadata": {"param_name": "lm_head.linear.kernel.value", "write_shape": [768, 50257], "chunk_shape": [768, 50257], "ext_metadata": null}}, {"array_metadata": {"param_name": "lm_head.lora_A.kernel.value", "write_shape": [768, 8], "chunk_shape": [768, 8], "ext_metadata": null}}, {"array_metadata": {"param_name": "lm_head.lora_B.kernel.value", "write_shape": [8, 50257], "chunk_shape": [8, 50257], "ext_metadata": null}}, {"array_metadata": {"param_name": "norm.bias.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "norm.scale.value", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "pos_embed.embedding.value", "write_shape": [512, 768], "chunk_shape": [512, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "token_embed.embedding.value", "write_shape": [50257, 768], "chunk_shape": [50257, 768], "ext_metadata": null}}]}
model/d/6c59d3c732fc4394586c213aca6515ae ADDED
Binary file (3.42 kB). View file
 
model/manifest.ocdbt ADDED
Binary file (118 Bytes). View file
 
model/ocdbt.process_0/d/4031c75894acb210608df91bd1a6ae73 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bf6feed1ae10ab5af6cf0ab55b6a57f6e5901db0f981a3acd38f002b9479ca5
3
+ size 8712192
model/ocdbt.process_0/d/5c83ac2b5d01d9393aa67efee0d7ee5c ADDED
Binary file (248 Bytes). View file
 
model/ocdbt.process_0/d/a6d725c1c9b94477df4e79223f9cffd5 ADDED
Binary file (552 Bytes). View file
 
model/ocdbt.process_0/d/afee9522c684dba13719890caae7e6ae ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ef677ab785fbfa504abde919213bbda93c7fe2036e4ea1b781b6a22e01c8c02
3
+ size 157904896
model/ocdbt.process_0/d/dd4142f6221e2dbaeb499a7791f74d28 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef4b9af9bd2888d863fca46ca83a5f856d493e47fba13a8a7a9ca415c8c42403
3
+ size 933122
model/ocdbt.process_0/d/fe9862bb771a1eb57def534a83e8e566 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:194607996414f2d3baf05f219c498a4af6bca7f52af3ba6d298b36366c13c26c
3
+ size 173555712
model/ocdbt.process_0/manifest.ocdbt ADDED
Binary file (365 Bytes). View file
 
qlora_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "lora_rank": 8,
3
+ "lora_alpha": 16,
4
+ "lora_dropout": 0.05,
5
+ "quant_bits": 4
6
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<|endoftext|>",
3
+ "eos_token": "<|endoftext|>",
4
+ "pad_token": "<|endoftext|>",
5
+ "unk_token": "<|endoftext|>"
6
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "50256": {
5
+ "content": "<|endoftext|>",
6
+ "lstrip": false,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ }
12
+ },
13
+ "bos_token": "<|endoftext|>",
14
+ "clean_up_tokenization_spaces": false,
15
+ "eos_token": "<|endoftext|>",
16
+ "extra_special_tokens": {},
17
+ "model_max_length": 512,
18
+ "pad_token": "<|endoftext|>",
19
+ "tokenizer_class": "GPT2Tokenizer",
20
+ "unk_token": "<|endoftext|>"
21
+ }
vocab.json ADDED
The diff for this file is too large to render. See raw diff