Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +54 -0
- clip/_CHECKPOINT_METADATA +1 -0
- clip/_METADATA +0 -0
- clip/_sharding +0 -0
- clip/array_metadatas/process_0 +1 -0
- clip/array_metadatas/process_1 +1 -0
- clip/array_metadatas/process_10 +1 -0
- clip/array_metadatas/process_11 +1 -0
- clip/array_metadatas/process_12 +1 -0
- clip/array_metadatas/process_13 +1 -0
- clip/array_metadatas/process_14 +1 -0
- clip/array_metadatas/process_15 +1 -0
- clip/array_metadatas/process_2 +1 -0
- clip/array_metadatas/process_3 +1 -0
- clip/array_metadatas/process_4 +1 -0
- clip/array_metadatas/process_5 +1 -0
- clip/array_metadatas/process_6 +1 -0
- clip/array_metadatas/process_7 +1 -0
- clip/array_metadatas/process_8 +1 -0
- clip/array_metadatas/process_9 +1 -0
- clip/commit_success.txt +1 -0
- clip/d/7e2d09763ea8c665446b1463911fecba +3 -0
- clip/manifest.ocdbt +0 -0
- clip/ocdbt.process_0/d/194e2e8a333c75b459dcbcabefc11ddf +3 -0
- clip/ocdbt.process_0/d/965dd2d0c3740930297faa2be0096920 +0 -0
- clip/ocdbt.process_0/d/edeaf853ce695a508f6ffd840d9e2cde +0 -0
- clip/ocdbt.process_0/d/f30727178cee928dc5493d096dbbb2b5 +3 -0
- clip/ocdbt.process_0/manifest.ocdbt +0 -0
- clip/ocdbt.process_1/d/691ea04338b06a7eecec2b608e581e38 +3 -0
- clip/ocdbt.process_1/d/739739ab217cd483129948a9bb18d5d9 +3 -0
- clip/ocdbt.process_1/manifest.ocdbt +0 -0
- clip/ocdbt.process_10/d/7901b44c8733386abb4c980dbca843da +3 -0
- clip/ocdbt.process_10/d/eb198fe0c1c1da5473e8c8e06bd69585 +3 -0
- clip/ocdbt.process_10/manifest.ocdbt +0 -0
- clip/ocdbt.process_11/d/2352515fa2894d9c7068e8b0b23df029 +3 -0
- clip/ocdbt.process_11/d/f98418d050a019f386eb358b8ce48b67 +3 -0
- clip/ocdbt.process_11/manifest.ocdbt +0 -0
- clip/ocdbt.process_12/d/643e52a5537736bc9b7de2e8453f48d4 +3 -0
- clip/ocdbt.process_12/d/cdf37d2f7525c256876010227ccfe676 +3 -0
- clip/ocdbt.process_12/manifest.ocdbt +0 -0
- clip/ocdbt.process_13/d/7067050dc78e306ec075b19bbd5e28e9 +3 -0
- clip/ocdbt.process_13/d/84e862e53202591d3306175afe4a42a9 +3 -0
- clip/ocdbt.process_13/manifest.ocdbt +0 -0
- clip/ocdbt.process_14/d/707f7e3db4b13ff05269d2ee5b337b87 +3 -0
- clip/ocdbt.process_14/d/fedd638294aa456389cee462fcfa539e +3 -0
- clip/ocdbt.process_14/manifest.ocdbt +0 -0
- clip/ocdbt.process_15/d/738ea6b2bc492be58942c98526816975 +3 -0
- clip/ocdbt.process_15/d/d4533d57d4757deab44242019ed789d6 +3 -0
- clip/ocdbt.process_15/manifest.ocdbt +0 -0
- clip/ocdbt.process_2/d/5bb38d5ee9cabe414133589ceeeb5c1a +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,57 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
clip/d/7e2d09763ea8c665446b1463911fecba filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
clip/ocdbt.process_0/d/194e2e8a333c75b459dcbcabefc11ddf filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
clip/ocdbt.process_0/d/f30727178cee928dc5493d096dbbb2b5 filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
clip/ocdbt.process_1/d/691ea04338b06a7eecec2b608e581e38 filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
clip/ocdbt.process_1/d/739739ab217cd483129948a9bb18d5d9 filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
clip/ocdbt.process_10/d/7901b44c8733386abb4c980dbca843da filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
clip/ocdbt.process_10/d/eb198fe0c1c1da5473e8c8e06bd69585 filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
clip/ocdbt.process_11/d/2352515fa2894d9c7068e8b0b23df029 filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
clip/ocdbt.process_11/d/f98418d050a019f386eb358b8ce48b67 filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
clip/ocdbt.process_12/d/643e52a5537736bc9b7de2e8453f48d4 filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
clip/ocdbt.process_12/d/cdf37d2f7525c256876010227ccfe676 filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
clip/ocdbt.process_13/d/7067050dc78e306ec075b19bbd5e28e9 filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
clip/ocdbt.process_13/d/84e862e53202591d3306175afe4a42a9 filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
clip/ocdbt.process_14/d/707f7e3db4b13ff05269d2ee5b337b87 filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
clip/ocdbt.process_14/d/fedd638294aa456389cee462fcfa539e filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
clip/ocdbt.process_15/d/738ea6b2bc492be58942c98526816975 filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
clip/ocdbt.process_15/d/d4533d57d4757deab44242019ed789d6 filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
clip/ocdbt.process_2/d/5bb38d5ee9cabe414133589ceeeb5c1a filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
clip/ocdbt.process_2/d/c6e4ef1b5ca84fdccbd09072c6337db6 filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
clip/ocdbt.process_3/d/1504395547eb3e2b32ecaf5f5a6964e9 filter=lfs diff=lfs merge=lfs -text
|
| 56 |
+
clip/ocdbt.process_3/d/3bde804ea84b7c1d083ccc535cfc60d1 filter=lfs diff=lfs merge=lfs -text
|
| 57 |
+
clip/ocdbt.process_4/d/310b64c7785e9052b248a3ded7813dba filter=lfs diff=lfs merge=lfs -text
|
| 58 |
+
clip/ocdbt.process_4/d/448f7a43d7c84e0245f3bafaef6ed885 filter=lfs diff=lfs merge=lfs -text
|
| 59 |
+
clip/ocdbt.process_5/d/0e596754b897a4eb0f2396e115cf5f99 filter=lfs diff=lfs merge=lfs -text
|
| 60 |
+
clip/ocdbt.process_5/d/b6a2877894c471bca74219ccdc79bb9f filter=lfs diff=lfs merge=lfs -text
|
| 61 |
+
clip/ocdbt.process_6/d/6cf9716d03aa4ad9a01f5874cc2c5777 filter=lfs diff=lfs merge=lfs -text
|
| 62 |
+
clip/ocdbt.process_6/d/9dd2b4fc543376833aba7b4a26c851fa filter=lfs diff=lfs merge=lfs -text
|
| 63 |
+
clip/ocdbt.process_7/d/1bd09540701f3f22958cd44d6ce59467 filter=lfs diff=lfs merge=lfs -text
|
| 64 |
+
clip/ocdbt.process_7/d/857c2552b4438536c163d98780a7c017 filter=lfs diff=lfs merge=lfs -text
|
| 65 |
+
clip/ocdbt.process_8/d/2180e4cbf3bd78beace7b88872672410 filter=lfs diff=lfs merge=lfs -text
|
| 66 |
+
clip/ocdbt.process_8/d/db6ef0af4e554ece53014db163340bca filter=lfs diff=lfs merge=lfs -text
|
| 67 |
+
clip/ocdbt.process_9/d/45ca79537fd19104d538f07f03edcc11 filter=lfs diff=lfs merge=lfs -text
|
| 68 |
+
clip/ocdbt.process_9/d/67499b45b933e482ec2bbf5821989dee filter=lfs diff=lfs merge=lfs -text
|
| 69 |
+
matrix-game-init/ocdbt.process_0/d/1aafacd9f72d2ca8e352e3291197be39 filter=lfs diff=lfs merge=lfs -text
|
| 70 |
+
matrix-game-init/ocdbt.process_0/d/1df984befa818857ba758481a22bd23d filter=lfs diff=lfs merge=lfs -text
|
| 71 |
+
matrix-game-init/ocdbt.process_0/d/5cad4a6b650139025002cc4cbe2c3de1 filter=lfs diff=lfs merge=lfs -text
|
| 72 |
+
matrix-game-init/ocdbt.process_0/d/a21cfffc746e13b18cab1d8903e3b879 filter=lfs diff=lfs merge=lfs -text
|
| 73 |
+
solaris/d/1f2bd345c5f842d245b2a2576ca5eba5 filter=lfs diff=lfs merge=lfs -text
|
| 74 |
+
solaris/ocdbt.process_0/d/79213e6e5a2575fcd3aa3609c5134550 filter=lfs diff=lfs merge=lfs -text
|
| 75 |
+
solaris/ocdbt.process_0/d/e2802600b384d14b0b74c2118702872d filter=lfs diff=lfs merge=lfs -text
|
| 76 |
+
solaris/ocdbt.process_1/d/4f2252430844216076bc041febdcfe86 filter=lfs diff=lfs merge=lfs -text
|
| 77 |
+
solaris/ocdbt.process_1/d/d5ba8369ddd27d68c5158213f940fedc filter=lfs diff=lfs merge=lfs -text
|
| 78 |
+
solaris/ocdbt.process_2/d/4c0119143b609fb979eb2834ec8269cd filter=lfs diff=lfs merge=lfs -text
|
| 79 |
+
solaris/ocdbt.process_2/d/fd8f087a5ad6e097686c97a1b4929cdd filter=lfs diff=lfs merge=lfs -text
|
| 80 |
+
solaris/ocdbt.process_3/d/7467364804cf6d4515dc2fa747563d60 filter=lfs diff=lfs merge=lfs -text
|
| 81 |
+
solaris/ocdbt.process_3/d/b637346fcb25d3141040cbb759bd363a filter=lfs diff=lfs merge=lfs -text
|
| 82 |
+
solaris/ocdbt.process_4/d/5169d76b0943b3194206644b8a99c628 filter=lfs diff=lfs merge=lfs -text
|
| 83 |
+
solaris/ocdbt.process_4/d/d123832151d708ce71920baf9b071aec filter=lfs diff=lfs merge=lfs -text
|
| 84 |
+
solaris/ocdbt.process_5/d/31f602e4711284170187bf724b5b29d4 filter=lfs diff=lfs merge=lfs -text
|
| 85 |
+
solaris/ocdbt.process_5/d/970fd567e6b82c3b965da38c0d461f8d filter=lfs diff=lfs merge=lfs -text
|
| 86 |
+
solaris/ocdbt.process_6/d/680c3d05b84dffc3aab1d70d59a97a6b filter=lfs diff=lfs merge=lfs -text
|
| 87 |
+
solaris/ocdbt.process_6/d/c9c1b0cd7facea8d15d5c995a5436c46 filter=lfs diff=lfs merge=lfs -text
|
| 88 |
+
solaris/ocdbt.process_7/d/79f0274fbd50bccb91b021cde434cca4 filter=lfs diff=lfs merge=lfs -text
|
| 89 |
+
solaris/ocdbt.process_7/d/91dcd8174f72cfe778349a126ebf5144 filter=lfs diff=lfs merge=lfs -text
|
clip/_CHECKPOINT_METADATA
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"item_handlers": "orbax.checkpoint._src.handlers.standard_checkpoint_handler.StandardCheckpointHandler", "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1761250920872137813, "commit_timestamp_nsecs": 1761250926254865703, "custom_metadata": {}}
|
clip/_METADATA
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
clip/_sharding
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
clip/array_metadatas/process_0
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "model.cls_embedding.value", "write_shape": [1, 1, 20], "chunk_shape": [1, 1, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.head.value", "write_shape": [20, 1024], "chunk_shape": [20, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.patch_embedding.kernel.value", "write_shape": [14, 14, 3, 20], "chunk_shape": [14, 14, 3, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pos_embedding.value", "write_shape": [1, 257, 20], "chunk_shape": [1, 257, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}]}
|
clip/array_metadatas/process_1
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "model.cls_embedding.value", "write_shape": [1, 1, 20], "chunk_shape": [1, 1, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.head.value", "write_shape": [20, 1024], "chunk_shape": [20, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.patch_embedding.kernel.value", "write_shape": [14, 14, 3, 20], "chunk_shape": [14, 14, 3, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pos_embedding.value", "write_shape": [1, 257, 20], "chunk_shape": [1, 257, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}]}
|
clip/array_metadatas/process_10
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "model.cls_embedding.value", "write_shape": [1, 1, 20], "chunk_shape": [1, 1, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.head.value", "write_shape": [20, 1024], "chunk_shape": [20, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.patch_embedding.kernel.value", "write_shape": [14, 14, 3, 20], "chunk_shape": [14, 14, 3, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pos_embedding.value", "write_shape": [1, 257, 20], "chunk_shape": [1, 257, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}]}
|
clip/array_metadatas/process_11
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "model.cls_embedding.value", "write_shape": [1, 1, 20], "chunk_shape": [1, 1, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.head.value", "write_shape": [20, 1024], "chunk_shape": [20, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.patch_embedding.kernel.value", "write_shape": [14, 14, 3, 20], "chunk_shape": [14, 14, 3, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pos_embedding.value", "write_shape": [1, 257, 20], "chunk_shape": [1, 257, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}]}
|
clip/array_metadatas/process_12
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "model.cls_embedding.value", "write_shape": [1, 1, 20], "chunk_shape": [1, 1, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.head.value", "write_shape": [20, 1024], "chunk_shape": [20, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.patch_embedding.kernel.value", "write_shape": [14, 14, 3, 20], "chunk_shape": [14, 14, 3, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pos_embedding.value", "write_shape": [1, 257, 20], "chunk_shape": [1, 257, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}]}
|
clip/array_metadatas/process_13
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "model.cls_embedding.value", "write_shape": [1, 1, 20], "chunk_shape": [1, 1, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.head.value", "write_shape": [20, 1024], "chunk_shape": [20, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.patch_embedding.kernel.value", "write_shape": [14, 14, 3, 20], "chunk_shape": [14, 14, 3, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pos_embedding.value", "write_shape": [1, 257, 20], "chunk_shape": [1, 257, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}]}
|
clip/array_metadatas/process_14
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "model.cls_embedding.value", "write_shape": [1, 1, 20], "chunk_shape": [1, 1, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.head.value", "write_shape": [20, 1024], "chunk_shape": [20, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.patch_embedding.kernel.value", "write_shape": [14, 14, 3, 20], "chunk_shape": [14, 14, 3, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pos_embedding.value", "write_shape": [1, 257, 20], "chunk_shape": [1, 257, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}]}
|
clip/array_metadatas/process_15
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "model.cls_embedding.value", "write_shape": [1, 1, 20], "chunk_shape": [1, 1, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.head.value", "write_shape": [20, 1024], "chunk_shape": [20, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.patch_embedding.kernel.value", "write_shape": [14, 14, 3, 20], "chunk_shape": [14, 14, 3, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pos_embedding.value", "write_shape": [1, 257, 20], "chunk_shape": [1, 257, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}]}
|
clip/array_metadatas/process_2
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "model.cls_embedding.value", "write_shape": [1, 1, 20], "chunk_shape": [1, 1, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.head.value", "write_shape": [20, 1024], "chunk_shape": [20, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.patch_embedding.kernel.value", "write_shape": [14, 14, 3, 20], "chunk_shape": [14, 14, 3, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pos_embedding.value", "write_shape": [1, 257, 20], "chunk_shape": [1, 257, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}]}
|
clip/array_metadatas/process_3
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "model.cls_embedding.value", "write_shape": [1, 1, 20], "chunk_shape": [1, 1, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.head.value", "write_shape": [20, 1024], "chunk_shape": [20, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.patch_embedding.kernel.value", "write_shape": [14, 14, 3, 20], "chunk_shape": [14, 14, 3, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pos_embedding.value", "write_shape": [1, 257, 20], "chunk_shape": [1, 257, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}]}
|
clip/array_metadatas/process_4
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "model.cls_embedding.value", "write_shape": [1, 1, 20], "chunk_shape": [1, 1, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.head.value", "write_shape": [20, 1024], "chunk_shape": [20, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.patch_embedding.kernel.value", "write_shape": [14, 14, 3, 20], "chunk_shape": [14, 14, 3, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pos_embedding.value", "write_shape": [1, 257, 20], "chunk_shape": [1, 257, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}]}
|
clip/array_metadatas/process_5
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "model.cls_embedding.value", "write_shape": [1, 1, 20], "chunk_shape": [1, 1, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.head.value", "write_shape": [20, 1024], "chunk_shape": [20, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.patch_embedding.kernel.value", "write_shape": [14, 14, 3, 20], "chunk_shape": [14, 14, 3, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pos_embedding.value", "write_shape": [1, 257, 20], "chunk_shape": [1, 257, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}]}
|
clip/array_metadatas/process_6
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "model.cls_embedding.value", "write_shape": [1, 1, 20], "chunk_shape": [1, 1, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.head.value", "write_shape": [20, 1024], "chunk_shape": [20, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.patch_embedding.kernel.value", "write_shape": [14, 14, 3, 20], "chunk_shape": [14, 14, 3, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pos_embedding.value", "write_shape": [1, 257, 20], "chunk_shape": [1, 257, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}]}
|
clip/array_metadatas/process_7
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "model.cls_embedding.value", "write_shape": [1, 1, 20], "chunk_shape": [1, 1, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.head.value", "write_shape": [20, 1024], "chunk_shape": [20, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.patch_embedding.kernel.value", "write_shape": [14, 14, 3, 20], "chunk_shape": [14, 14, 3, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pos_embedding.value", "write_shape": [1, 257, 20], "chunk_shape": [1, 257, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}]}
|
clip/array_metadatas/process_8
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "model.cls_embedding.value", "write_shape": [1, 1, 20], "chunk_shape": [1, 1, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.head.value", "write_shape": [20, 1024], "chunk_shape": [20, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.patch_embedding.kernel.value", "write_shape": [14, 14, 3, 20], "chunk_shape": [14, 14, 3, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pos_embedding.value", "write_shape": [1, 257, 20], "chunk_shape": [1, 257, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}]}
|
clip/array_metadatas/process_9
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "model.cls_embedding.value", "write_shape": [1, 1, 20], "chunk_shape": [1, 1, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.head.value", "write_shape": [20, 1024], "chunk_shape": [20, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.patch_embedding.kernel.value", "write_shape": [14, 14, 3, 20], "chunk_shape": [14, 14, 3, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pos_embedding.value", "write_shape": [1, 257, 20], "chunk_shape": [1, 257, 20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.post_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.pre_norm.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.0.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.1.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.2.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.3.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.4.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.5.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.6.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.7.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.8.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.9.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.10.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.11.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.12.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.13.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.14.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.15.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.16.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.17.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.18.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.19.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.20.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.21.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.22.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.23.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.24.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.25.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.26.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.27.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.28.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.29.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.30.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.proj.kernel.value", "write_shape": [20, 1280], "chunk_shape": [20, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.bias.value", "write_shape": [60], "chunk_shape": [60], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.attn.to_qkv.kernel.value", "write_shape": [20, 3840], "chunk_shape": [20, 3840], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.bias.value", "write_shape": [80], "chunk_shape": [80], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.0.kernel.value", "write_shape": [20, 5120], "chunk_shape": [20, 5120], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.mlp.layers.2.kernel.value", "write_shape": [80, 1280], "chunk_shape": [80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm1.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.bias.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}, {"array_metadata": {"param_name": "model.transformer.31.norm2.scale.value", "write_shape": [20], "chunk_shape": [20], "ext_metadata": null}}]}
|
clip/commit_success.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
Checkpoint commit was successful to gs://solaris-central1/solaris/model/pretrained/clip
|
clip/d/7e2d09763ea8c665446b1463911fecba
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2819382df207de5527ea9b843e43f6dfdf2245a4f85c703578b823260890fb97
|
| 3 |
+
size 1482926
|
clip/manifest.ocdbt
ADDED
|
Binary file (121 Bytes). View file
|
|
|
clip/ocdbt.process_0/d/194e2e8a333c75b459dcbcabefc11ddf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c3ca79d00330f5733133f476202df3a83314a99308d5d1636d32b50d33ea8d7a
|
| 3 |
+
size 59785516
|
clip/ocdbt.process_0/d/965dd2d0c3740930297faa2be0096920
ADDED
|
Binary file (202 Bytes). View file
|
|
|
clip/ocdbt.process_0/d/edeaf853ce695a508f6ffd840d9e2cde
ADDED
|
Binary file (722 Bytes). View file
|
|
|
clip/ocdbt.process_0/d/f30727178cee928dc5493d096dbbb2b5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4f5930a2cc0b90cccc8d2a25fbd40adeabf56253ce40373f4ee6a7dbc5736eac
|
| 3 |
+
size 15856746
|
clip/ocdbt.process_0/manifest.ocdbt
ADDED
|
Binary file (265 Bytes). View file
|
|
|
clip/ocdbt.process_1/d/691ea04338b06a7eecec2b608e581e38
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5427db1ae84657b9983a56a5152616907e1c0b57347174fc77cd61fb9b4749f0
|
| 3 |
+
size 57232799
|
clip/ocdbt.process_1/d/739739ab217cd483129948a9bb18d5d9
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a24113b4f6c0c3a33a00b7c443974536f45ec514204cabea55dcc58583db31a5
|
| 3 |
+
size 18408936
|
clip/ocdbt.process_1/manifest.ocdbt
ADDED
|
Binary file (184 Bytes). View file
|
|
|
clip/ocdbt.process_10/d/7901b44c8733386abb4c980dbca843da
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5ba1010f43dd19f4290c5eb100e926785a0a4eda99373e8ee18f7b71c2a2ff3
|
| 3 |
+
size 59509118
|
clip/ocdbt.process_10/d/eb198fe0c1c1da5473e8c8e06bd69585
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:63f256ef2dc25399cb3ed2877174d616123856d0779bf4ed30981d81818a2fd7
|
| 3 |
+
size 16133783
|
clip/ocdbt.process_10/manifest.ocdbt
ADDED
|
Binary file (184 Bytes). View file
|
|
|
clip/ocdbt.process_11/d/2352515fa2894d9c7068e8b0b23df029
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f87f85c1cda4cc7a1e3ae987d776b72df648ba2693e71814c2f1f95c042a95f3
|
| 3 |
+
size 27551147
|
clip/ocdbt.process_11/d/f98418d050a019f386eb358b8ce48b67
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c18be45bf96098389cebfc8a77734b4fea346d09b7b97668c33d1192d6988f4
|
| 3 |
+
size 48124855
|
clip/ocdbt.process_11/manifest.ocdbt
ADDED
|
Binary file (184 Bytes). View file
|
|
|
clip/ocdbt.process_12/d/643e52a5537736bc9b7de2e8453f48d4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bb9fbec7619c13121b65934c6d7d94d60fe718d91dce220a1fa676f29048b2e0
|
| 3 |
+
size 28157157
|
clip/ocdbt.process_12/d/cdf37d2f7525c256876010227ccfe676
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0f11d4bb734af134aae65ee89861dfb69bd41abffeaade46d9b94747250cf810
|
| 3 |
+
size 47546972
|
clip/ocdbt.process_12/manifest.ocdbt
ADDED
|
Binary file (184 Bytes). View file
|
|
|
clip/ocdbt.process_13/d/7067050dc78e306ec075b19bbd5e28e9
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a545cad5b6309d28cc9fb82e4496589cab589ffffbe0c82896344941d4507d14
|
| 3 |
+
size 38188634
|
clip/ocdbt.process_13/d/84e862e53202591d3306175afe4a42a9
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd05d370eedbce9a9805088d72d28ef23bb621eb93b3aa96d88c45e66f2a1f6b
|
| 3 |
+
size 37538336
|
clip/ocdbt.process_13/manifest.ocdbt
ADDED
|
Binary file (184 Bytes). View file
|
|
|
clip/ocdbt.process_14/d/707f7e3db4b13ff05269d2ee5b337b87
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:41aa6569cfd60356084fac96a3feaf2834a02afdd7ba9f400fe3e929a32f04cd
|
| 3 |
+
size 24828348
|
clip/ocdbt.process_14/d/fedd638294aa456389cee462fcfa539e
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:09e5711e8401127d4a6d42f0ecde0ed44bb2328e2f41d81dee51a38863e629ef
|
| 3 |
+
size 50822142
|
clip/ocdbt.process_14/manifest.ocdbt
ADDED
|
Binary file (184 Bytes). View file
|
|
|
clip/ocdbt.process_15/d/738ea6b2bc492be58942c98526816975
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b4c441f92b073f025588e56ebc933f9f3eda9cb80b7612aa9e77c57cf0069fcd
|
| 3 |
+
size 59077516
|
clip/ocdbt.process_15/d/d4533d57d4757deab44242019ed789d6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe6a12e2765d4b70b87c2051e19d6db73745035c09e406bd7fce0a138e119e02
|
| 3 |
+
size 16609115
|
clip/ocdbt.process_15/manifest.ocdbt
ADDED
|
Binary file (184 Bytes). View file
|
|
|
clip/ocdbt.process_2/d/5bb38d5ee9cabe414133589ceeeb5c1a
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed8f786e7c4caa4f4690b4ff2699d94f73d80e938c9c6cb4ceac4c43c4a211bc
|
| 3 |
+
size 37959216
|