Upload folder using huggingface_hub
Browse files- .gitattributes +18 -0
- mp_causal_60000.pt/_CHECKPOINT_METADATA +1 -0
- mp_causal_60000.pt/_METADATA +1 -0
- mp_causal_60000.pt/_sharding +1 -0
- mp_causal_60000.pt/array_metadatas/process_0 +1 -0
- mp_causal_60000.pt/array_metadatas/process_1 +1 -0
- mp_causal_60000.pt/array_metadatas/process_2 +1 -0
- mp_causal_60000.pt/array_metadatas/process_3 +1 -0
- mp_causal_60000.pt/array_metadatas/process_4 +1 -0
- mp_causal_60000.pt/array_metadatas/process_5 +1 -0
- mp_causal_60000.pt/array_metadatas/process_6 +1 -0
- mp_causal_60000.pt/array_metadatas/process_7 +1 -0
- mp_causal_60000.pt/commit_success.txt +1 -0
- mp_causal_60000.pt/d/009656ae062ac3299a9aa0f0d609e4aa +3 -0
- mp_causal_60000.pt/manifest.ocdbt +0 -0
- mp_causal_60000.pt/ocdbt.process_0/d/3695460b7707a19f8f8eecb85bd97ab2 +3 -0
- mp_causal_60000.pt/ocdbt.process_0/d/417a017d285ccaa9531f43c034552e58 +0 -0
- mp_causal_60000.pt/ocdbt.process_0/d/5abdbd3f4919e95295173e494a934cbb +3 -0
- mp_causal_60000.pt/ocdbt.process_0/d/ab13a2e3a9a8f7101f3308d66a9d8952 +3 -0
- mp_causal_60000.pt/ocdbt.process_0/manifest.ocdbt +0 -0
- mp_causal_60000.pt/ocdbt.process_1/d/49765cb511d5a29ed37a4f1fef7718e6 +3 -0
- mp_causal_60000.pt/ocdbt.process_1/d/525417d8de2264a1cc2ceb60acb26ec5 +3 -0
- mp_causal_60000.pt/ocdbt.process_1/manifest.ocdbt +0 -0
- mp_causal_60000.pt/ocdbt.process_2/d/0be520c321a634b0ca6f4fe6bce8e891 +3 -0
- mp_causal_60000.pt/ocdbt.process_2/d/225c40b0464162d4d3665808d735893d +3 -0
- mp_causal_60000.pt/ocdbt.process_2/manifest.ocdbt +0 -0
- mp_causal_60000.pt/ocdbt.process_3/d/21c873b9a7006fb3b7b2a3345f2007dd +3 -0
- mp_causal_60000.pt/ocdbt.process_3/d/5fab00d2588cd26a1ec3265788f45294 +3 -0
- mp_causal_60000.pt/ocdbt.process_3/manifest.ocdbt +0 -0
- mp_causal_60000.pt/ocdbt.process_4/d/04bc0911120bfcb6658465a2768bb823 +3 -0
- mp_causal_60000.pt/ocdbt.process_4/d/160e82bbbfe8c7eb03559a914b57807f +3 -0
- mp_causal_60000.pt/ocdbt.process_4/manifest.ocdbt +0 -0
- mp_causal_60000.pt/ocdbt.process_5/d/0105ce032e58c01b1a87722da49cf075 +3 -0
- mp_causal_60000.pt/ocdbt.process_5/d/0d767211e01bd5107223d6ebb4b55e55 +3 -0
- mp_causal_60000.pt/ocdbt.process_5/manifest.ocdbt +0 -0
- mp_causal_60000.pt/ocdbt.process_6/d/322c3f14eefdd0d22a2b21107075a20e +3 -0
- mp_causal_60000.pt/ocdbt.process_6/d/c372ea76909d79ee62ec3a482a4b6865 +3 -0
- mp_causal_60000.pt/ocdbt.process_6/manifest.ocdbt +0 -0
- mp_causal_60000.pt/ocdbt.process_7/d/5bc6c9d3af5b0900c8806766c6192a53 +3 -0
- mp_causal_60000.pt/ocdbt.process_7/d/5e7e04aee528841d2f1b0d91d946db66 +3 -0
- mp_causal_60000.pt/ocdbt.process_7/manifest.ocdbt +0 -0
.gitattributes
CHANGED
|
@@ -87,3 +87,21 @@ mp_bidirectional_120000.pt/ocdbt.process_6/d/974d2ea3375d4afae154bf234e6d932d fi
|
|
| 87 |
mp_bidirectional_120000.pt/ocdbt.process_6/d/b977bce3e08f2761fa4cc115ac6bb22f filter=lfs diff=lfs merge=lfs -text
|
| 88 |
mp_bidirectional_120000.pt/ocdbt.process_7/d/62ad7ede1673afd5972b964e1ffa65d3 filter=lfs diff=lfs merge=lfs -text
|
| 89 |
mp_bidirectional_120000.pt/ocdbt.process_7/d/73d0a8ede0b8f4532bc44da8b166a2eb filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 87 |
mp_bidirectional_120000.pt/ocdbt.process_6/d/b977bce3e08f2761fa4cc115ac6bb22f filter=lfs diff=lfs merge=lfs -text
|
| 88 |
mp_bidirectional_120000.pt/ocdbt.process_7/d/62ad7ede1673afd5972b964e1ffa65d3 filter=lfs diff=lfs merge=lfs -text
|
| 89 |
mp_bidirectional_120000.pt/ocdbt.process_7/d/73d0a8ede0b8f4532bc44da8b166a2eb filter=lfs diff=lfs merge=lfs -text
|
| 90 |
+
mp_causal_60000.pt/d/009656ae062ac3299a9aa0f0d609e4aa filter=lfs diff=lfs merge=lfs -text
|
| 91 |
+
mp_causal_60000.pt/ocdbt.process_0/d/3695460b7707a19f8f8eecb85bd97ab2 filter=lfs diff=lfs merge=lfs -text
|
| 92 |
+
mp_causal_60000.pt/ocdbt.process_0/d/5abdbd3f4919e95295173e494a934cbb filter=lfs diff=lfs merge=lfs -text
|
| 93 |
+
mp_causal_60000.pt/ocdbt.process_0/d/ab13a2e3a9a8f7101f3308d66a9d8952 filter=lfs diff=lfs merge=lfs -text
|
| 94 |
+
mp_causal_60000.pt/ocdbt.process_1/d/49765cb511d5a29ed37a4f1fef7718e6 filter=lfs diff=lfs merge=lfs -text
|
| 95 |
+
mp_causal_60000.pt/ocdbt.process_1/d/525417d8de2264a1cc2ceb60acb26ec5 filter=lfs diff=lfs merge=lfs -text
|
| 96 |
+
mp_causal_60000.pt/ocdbt.process_2/d/0be520c321a634b0ca6f4fe6bce8e891 filter=lfs diff=lfs merge=lfs -text
|
| 97 |
+
mp_causal_60000.pt/ocdbt.process_2/d/225c40b0464162d4d3665808d735893d filter=lfs diff=lfs merge=lfs -text
|
| 98 |
+
mp_causal_60000.pt/ocdbt.process_3/d/21c873b9a7006fb3b7b2a3345f2007dd filter=lfs diff=lfs merge=lfs -text
|
| 99 |
+
mp_causal_60000.pt/ocdbt.process_3/d/5fab00d2588cd26a1ec3265788f45294 filter=lfs diff=lfs merge=lfs -text
|
| 100 |
+
mp_causal_60000.pt/ocdbt.process_4/d/04bc0911120bfcb6658465a2768bb823 filter=lfs diff=lfs merge=lfs -text
|
| 101 |
+
mp_causal_60000.pt/ocdbt.process_4/d/160e82bbbfe8c7eb03559a914b57807f filter=lfs diff=lfs merge=lfs -text
|
| 102 |
+
mp_causal_60000.pt/ocdbt.process_5/d/0105ce032e58c01b1a87722da49cf075 filter=lfs diff=lfs merge=lfs -text
|
| 103 |
+
mp_causal_60000.pt/ocdbt.process_5/d/0d767211e01bd5107223d6ebb4b55e55 filter=lfs diff=lfs merge=lfs -text
|
| 104 |
+
mp_causal_60000.pt/ocdbt.process_6/d/322c3f14eefdd0d22a2b21107075a20e filter=lfs diff=lfs merge=lfs -text
|
| 105 |
+
mp_causal_60000.pt/ocdbt.process_6/d/c372ea76909d79ee62ec3a482a4b6865 filter=lfs diff=lfs merge=lfs -text
|
| 106 |
+
mp_causal_60000.pt/ocdbt.process_7/d/5bc6c9d3af5b0900c8806766c6192a53 filter=lfs diff=lfs merge=lfs -text
|
| 107 |
+
mp_causal_60000.pt/ocdbt.process_7/d/5e7e04aee528841d2f1b0d91d946db66 filter=lfs diff=lfs merge=lfs -text
|
mp_causal_60000.pt/_CHECKPOINT_METADATA
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"item_handlers": "orbax.checkpoint._src.handlers.standard_checkpoint_handler.StandardCheckpointHandler", "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1768927118604876117, "commit_timestamp_nsecs": 1768927136561342347, "custom_metadata": {}}
|
mp_causal_60000.pt/_METADATA
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"tree_metadata": {"('blocks', 'action_model', 'img_attn_k_norm', 'weight', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "img_attn_k_norm", "key_type": 2}, {"key": "weight", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 2]}}, "('blocks', 'action_model', 'img_attn_q_norm', 'weight', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "img_attn_q_norm", "key_type": 2}, {"key": "weight", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 2]}}, "('blocks', 'action_model', 'key_attn_k_norm', 'weight', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "key_attn_k_norm", "key_type": 2}, {"key": "weight", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 2]}}, "('blocks', 'action_model', 'key_attn_q_norm', 'weight', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "key_attn_q_norm", "key_type": 2}, {"key": "weight", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 2]}}, "('blocks', 'action_model', 'keyboard_attn_kv', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "keyboard_attn_kv", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 2048]}}, "('blocks', 'action_model', 'keyboard_embed', 'layers', '0', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "keyboard_embed", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 4]}}, "('blocks', 'action_model', 'keyboard_embed', 'layers', '0', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "keyboard_embed", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 23, 4]}}, "('blocks', 'action_model', 'keyboard_embed', 'layers', '2', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "keyboard_embed", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 4]}}, "('blocks', 'action_model', 'keyboard_embed', 'layers', '2', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "keyboard_embed", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 4, 128]}}, "('blocks', 'action_model', 'mouse_attn_q', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "mouse_attn_q", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1024]}}, "('blocks', 'action_model', 'mouse_mlp', 'layers', '0', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "mouse_mlp", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 32]}}, "('blocks', 'action_model', 'mouse_mlp', 'layers', '0', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "mouse_mlp", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 1560, 32]}}, "('blocks', 'action_model', 'mouse_mlp', 'layers', '2', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "mouse_mlp", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 32]}}, "('blocks', 'action_model', 'mouse_mlp', 'layers', '2', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "mouse_mlp", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 32, 1024]}}, "('blocks', 'action_model', 'mouse_mlp', 'layers', '3', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "mouse_mlp", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "3", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 32]}}, "('blocks', 'action_model', 'mouse_mlp', 'layers', '3', 'scale', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "mouse_mlp", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "3", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 32]}}, "('blocks', 'action_model', 'proj_keyboard', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "proj_keyboard", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 32, 1536]}}, "('blocks', 'action_model', 'proj_mouse', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "proj_mouse", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 32, 1536]}}, "('blocks', 'action_model', 't_qkv', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "t_qkv", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 32, 3072]}}, "('blocks', 'cross_attn', 'k', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'cross_attn', 'k', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1536]}}, "('blocks', 'cross_attn', 'norm_k', 'weight', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "norm_k", "key_type": 2}, {"key": "weight", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'cross_attn', 'norm_q', 'weight', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "norm_q", "key_type": 2}, {"key": "weight", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'cross_attn', 'o', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'cross_attn', 'o', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1536]}}, "('blocks', 'cross_attn', 'q', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'cross_attn', 'q', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1536]}}, "('blocks', 'cross_attn', 'v', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'cross_attn', 'v', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1536]}}, "('blocks', 'ffn', 'layers', '0', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "ffn", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 280]}}, "('blocks', 'ffn', 'layers', '0', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "ffn", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 8960]}}, "('blocks', 'ffn', 'layers', '2', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "ffn", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'ffn', 'layers', '2', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "ffn", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 280, 1536]}}, "('blocks', 'modulation', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "modulation", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 1, 6, 48]}}, "('blocks', 'norm3', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "norm3", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'norm3', 'scale', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "norm3", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'self_attn', 'k', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'self_attn', 'k', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1536]}}, "('blocks', 'self_attn', 'norm_k', 'weight', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "norm_k", "key_type": 2}, {"key": "weight", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'self_attn', 'norm_q', 'weight', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "norm_q", "key_type": 2}, {"key": "weight", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'self_attn', 'o', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'self_attn', 'o', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1536]}}, "('blocks', 'self_attn', 'q', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'self_attn', 'q', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1536]}}, "('blocks', 'self_attn', 'v', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'self_attn', 'v', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1536]}}, "('head', 'head', 'bias', 'value')": {"key_metadata": [{"key": "head", "key_type": 2}, {"key": "head", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [2]}}, "('head', 'head', 'kernel', 'value')": {"key_metadata": [{"key": "head", "key_type": 2}, {"key": "head", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48, 64]}}, "('head', 'modulation', 'value')": {"key_metadata": [{"key": "head", "key_type": 2}, {"key": "modulation", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [1, 2, 48]}}, "('img_emb', 'proj', '0', 'bias', 'value')": {"key_metadata": [{"key": "img_emb", "key_type": 2}, {"key": "proj", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [40]}}, "('img_emb', 'proj', '0', 'scale', 'value')": {"key_metadata": [{"key": "img_emb", "key_type": 2}, {"key": "proj", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [40]}}, "('img_emb', 'proj', '1', 'bias', 'value')": {"key_metadata": [{"key": "img_emb", "key_type": 2}, {"key": "proj", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [40]}}, "('img_emb', 'proj', '1', 'kernel', 'value')": {"key_metadata": [{"key": "img_emb", "key_type": 2}, {"key": "proj", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [40, 1280]}}, "('img_emb', 'proj', '2', 'bias', 'value')": {"key_metadata": [{"key": "img_emb", "key_type": 2}, {"key": "proj", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48]}}, "('img_emb', 'proj', '2', 'kernel', 'value')": {"key_metadata": [{"key": "img_emb", "key_type": 2}, {"key": "proj", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [40, 1536]}}, "('img_emb', 'proj', '3', 'bias', 'value')": {"key_metadata": [{"key": "img_emb", "key_type": 2}, {"key": "proj", "key_type": 2}, {"key": "3", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48]}}, "('img_emb', 'proj', '3', 'scale', 'value')": {"key_metadata": [{"key": "img_emb", "key_type": 2}, {"key": "proj", "key_type": 2}, {"key": "3", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48]}}, "('patch_embedding', 'bias', 'value')": {"key_metadata": [{"key": "patch_embedding", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48]}}, "('patch_embedding', 'kernel', 'value')": {"key_metadata": [{"key": "patch_embedding", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [1, 2, 2, 36, 48]}}, "('player_embed', 'embedding', 'value')": {"key_metadata": [{"key": "player_embed", "key_type": 2}, {"key": "embedding", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [2, 48]}}, "('time_embedding', 'layers', '0', 'bias', 'value')": {"key_metadata": [{"key": "time_embedding", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48]}}, "('time_embedding', 'layers', '0', 'kernel', 'value')": {"key_metadata": [{"key": "time_embedding", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [8, 1536]}}, "('time_embedding', 'layers', '2', 'bias', 'value')": {"key_metadata": [{"key": "time_embedding", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48]}}, "('time_embedding', 'layers', '2', 'kernel', 'value')": {"key_metadata": [{"key": "time_embedding", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48, 1536]}}, "('time_projection', 'layers', '1', 'bias', 'value')": {"key_metadata": [{"key": "time_projection", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [288]}}, "('time_projection', 'layers', '1', 'kernel', 'value')": {"key_metadata": [{"key": "time_projection", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48, 9216]}}}, "use_zarr3": false, "store_array_data_equal_to_fill_value": true, "custom_metadata": null}
|
mp_causal_60000.pt/_sharding
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"YmxvY2tzLm1vZHVsYXRpb24udmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLm5vcm0zLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLm5vcm0zLnNjYWxlLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC50X3Frdi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5pbWdfYXR0bl9rX25vcm0ud2VpZ2h0LnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5pbWdfYXR0bl9xX25vcm0ud2VpZ2h0LnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5rZXlfYXR0bl9rX25vcm0ud2VpZ2h0LnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5rZXlfYXR0bl9xX25vcm0ud2VpZ2h0LnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5rZXlib2FyZF9hdHRuX2t2Lmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5rZXlib2FyZF9lbWJlZC5sYXllcnMuMC5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5rZXlib2FyZF9lbWJlZC5sYXllcnMuMC5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5rZXlib2FyZF9lbWJlZC5sYXllcnMuMi5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5rZXlib2FyZF9lbWJlZC5sYXllcnMuMi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5tb3VzZV9hdHRuX3Eua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5tb3VzZV9tbHAubGF5ZXJzLjAuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5tb3VzZV9tbHAubGF5ZXJzLjAua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5tb3VzZV9tbHAubGF5ZXJzLjIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5tb3VzZV9tbHAubGF5ZXJzLjIua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5tb3VzZV9tbHAubGF5ZXJzLjMuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5tb3VzZV9tbHAubGF5ZXJzLjMuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5wcm9qX21vdXNlLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5wcm9qX2tleWJvYXJkLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4uay5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4uay5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4ubm9ybV9rLndlaWdodC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4ubm9ybV9xLndlaWdodC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4uby5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4uby5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4ucS5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4ucS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4udi5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4udi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmZmbi5sYXllcnMuMC5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmZmbi5sYXllcnMuMC5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, \"data\", null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmZmbi5sYXllcnMuMi5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmZmbi5sYXllcnMuMi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi52LmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi52Lmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi5rLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi5rLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi5ub3JtX2sud2VpZ2h0LnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi5ub3JtX3Eud2VpZ2h0LnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi5vLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi5vLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi5xLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi5xLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aGVhZC5oZWFkLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aGVhZC5oZWFkLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aGVhZC5tb2R1bGF0aW9uLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aW1nX2VtYi5wcm9qLjAuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aW1nX2VtYi5wcm9qLjAuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aW1nX2VtYi5wcm9qLjEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aW1nX2VtYi5wcm9qLjEua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aW1nX2VtYi5wcm9qLjIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aW1nX2VtYi5wcm9qLjIua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aW1nX2VtYi5wcm9qLjMuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aW1nX2VtYi5wcm9qLjMuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","cGF0Y2hfZW1iZWRkaW5nLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","cGF0Y2hfZW1iZWRkaW5nLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","cGxheWVyX2VtYmVkLmVtYmVkZGluZy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","dGltZV9lbWJlZGRpbmcubGF5ZXJzLjAuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","dGltZV9lbWJlZGRpbmcubGF5ZXJzLjAua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","dGltZV9lbWJlZGRpbmcubGF5ZXJzLjIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","dGltZV9lbWJlZGRpbmcubGF5ZXJzLjIua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","dGltZV9wcm9qZWN0aW9uLmxheWVycy4xLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","dGltZV9wcm9qZWN0aW9uLmxheWVycy4xLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}"}
|
mp_causal_60000.pt/array_metadatas/process_0
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "blocks.action_model.img_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.img_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_attn_kv.kernel.value", "write_shape": [30, 48, 2048], "chunk_shape": [30, 48, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.kernel.value", "write_shape": [30, 23, 4], "chunk_shape": [30, 23, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.kernel.value", "write_shape": [30, 4, 128], "chunk_shape": [30, 4, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_attn_q.kernel.value", "write_shape": [30, 48, 1024], "chunk_shape": [30, 48, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.kernel.value", "write_shape": [30, 1560, 32], "chunk_shape": [30, 1560, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.kernel.value", "write_shape": [30, 32, 1024], "chunk_shape": [30, 32, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.scale.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_keyboard.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_mouse.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.t_qkv.kernel.value", "write_shape": [30, 32, 3072], "chunk_shape": [30, 32, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.bias.value", "write_shape": [30, 280], "chunk_shape": [30, 280], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.kernel.value", "write_shape": [30, 48, 8960], "chunk_shape": [30, 48, 8960], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.kernel.value", "write_shape": [30, 280, 1536], "chunk_shape": [30, 280, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.modulation.value", "write_shape": [30, 1, 6, 48], "chunk_shape": [30, 1, 6, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.scale.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.bias.value", "write_shape": [2], "chunk_shape": [2], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.kernel.value", "write_shape": [48, 64], "chunk_shape": [48, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.modulation.value", "write_shape": [1, 2, 48], "chunk_shape": [1, 2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.scale.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.kernel.value", "write_shape": [40, 1280], "chunk_shape": [40, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.kernel.value", "write_shape": [40, 1536], "chunk_shape": [40, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.scale.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.kernel.value", "write_shape": [1, 2, 2, 36, 48], "chunk_shape": [1, 2, 2, 36, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "player_embed.embedding.value", "write_shape": [2, 48], "chunk_shape": [2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.kernel.value", "write_shape": [8, 1536], "chunk_shape": [8, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.kernel.value", "write_shape": [48, 1536], "chunk_shape": [48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.bias.value", "write_shape": [288], "chunk_shape": [288], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.kernel.value", "write_shape": [48, 9216], "chunk_shape": [48, 9216], "ext_metadata": null}}]}
|
mp_causal_60000.pt/array_metadatas/process_1
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "blocks.action_model.img_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.img_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_attn_kv.kernel.value", "write_shape": [30, 48, 2048], "chunk_shape": [30, 48, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.kernel.value", "write_shape": [30, 23, 4], "chunk_shape": [30, 23, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.kernel.value", "write_shape": [30, 4, 128], "chunk_shape": [30, 4, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_attn_q.kernel.value", "write_shape": [30, 48, 1024], "chunk_shape": [30, 48, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.kernel.value", "write_shape": [30, 1560, 32], "chunk_shape": [30, 1560, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.kernel.value", "write_shape": [30, 32, 1024], "chunk_shape": [30, 32, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.scale.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_keyboard.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_mouse.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.t_qkv.kernel.value", "write_shape": [30, 32, 3072], "chunk_shape": [30, 32, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.bias.value", "write_shape": [30, 280], "chunk_shape": [30, 280], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.kernel.value", "write_shape": [30, 48, 8960], "chunk_shape": [30, 48, 8960], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.kernel.value", "write_shape": [30, 280, 1536], "chunk_shape": [30, 280, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.modulation.value", "write_shape": [30, 1, 6, 48], "chunk_shape": [30, 1, 6, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.scale.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.bias.value", "write_shape": [2], "chunk_shape": [2], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.kernel.value", "write_shape": [48, 64], "chunk_shape": [48, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.modulation.value", "write_shape": [1, 2, 48], "chunk_shape": [1, 2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.scale.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.kernel.value", "write_shape": [40, 1280], "chunk_shape": [40, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.kernel.value", "write_shape": [40, 1536], "chunk_shape": [40, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.scale.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.kernel.value", "write_shape": [1, 2, 2, 36, 48], "chunk_shape": [1, 2, 2, 36, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "player_embed.embedding.value", "write_shape": [2, 48], "chunk_shape": [2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.kernel.value", "write_shape": [8, 1536], "chunk_shape": [8, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.kernel.value", "write_shape": [48, 1536], "chunk_shape": [48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.bias.value", "write_shape": [288], "chunk_shape": [288], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.kernel.value", "write_shape": [48, 9216], "chunk_shape": [48, 9216], "ext_metadata": null}}]}
|
mp_causal_60000.pt/array_metadatas/process_2
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "blocks.action_model.img_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.img_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_attn_kv.kernel.value", "write_shape": [30, 48, 2048], "chunk_shape": [30, 48, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.kernel.value", "write_shape": [30, 23, 4], "chunk_shape": [30, 23, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.kernel.value", "write_shape": [30, 4, 128], "chunk_shape": [30, 4, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_attn_q.kernel.value", "write_shape": [30, 48, 1024], "chunk_shape": [30, 48, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.kernel.value", "write_shape": [30, 1560, 32], "chunk_shape": [30, 1560, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.kernel.value", "write_shape": [30, 32, 1024], "chunk_shape": [30, 32, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.scale.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_keyboard.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_mouse.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.t_qkv.kernel.value", "write_shape": [30, 32, 3072], "chunk_shape": [30, 32, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.bias.value", "write_shape": [30, 280], "chunk_shape": [30, 280], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.kernel.value", "write_shape": [30, 48, 8960], "chunk_shape": [30, 48, 8960], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.kernel.value", "write_shape": [30, 280, 1536], "chunk_shape": [30, 280, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.modulation.value", "write_shape": [30, 1, 6, 48], "chunk_shape": [30, 1, 6, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.scale.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.bias.value", "write_shape": [2], "chunk_shape": [2], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.kernel.value", "write_shape": [48, 64], "chunk_shape": [48, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.modulation.value", "write_shape": [1, 2, 48], "chunk_shape": [1, 2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.scale.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.kernel.value", "write_shape": [40, 1280], "chunk_shape": [40, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.kernel.value", "write_shape": [40, 1536], "chunk_shape": [40, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.scale.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.kernel.value", "write_shape": [1, 2, 2, 36, 48], "chunk_shape": [1, 2, 2, 36, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "player_embed.embedding.value", "write_shape": [2, 48], "chunk_shape": [2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.kernel.value", "write_shape": [8, 1536], "chunk_shape": [8, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.kernel.value", "write_shape": [48, 1536], "chunk_shape": [48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.bias.value", "write_shape": [288], "chunk_shape": [288], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.kernel.value", "write_shape": [48, 9216], "chunk_shape": [48, 9216], "ext_metadata": null}}]}
|
mp_causal_60000.pt/array_metadatas/process_3
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "blocks.action_model.img_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.img_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_attn_kv.kernel.value", "write_shape": [30, 48, 2048], "chunk_shape": [30, 48, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.kernel.value", "write_shape": [30, 23, 4], "chunk_shape": [30, 23, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.kernel.value", "write_shape": [30, 4, 128], "chunk_shape": [30, 4, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_attn_q.kernel.value", "write_shape": [30, 48, 1024], "chunk_shape": [30, 48, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.kernel.value", "write_shape": [30, 1560, 32], "chunk_shape": [30, 1560, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.kernel.value", "write_shape": [30, 32, 1024], "chunk_shape": [30, 32, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.scale.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_keyboard.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_mouse.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.t_qkv.kernel.value", "write_shape": [30, 32, 3072], "chunk_shape": [30, 32, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.bias.value", "write_shape": [30, 280], "chunk_shape": [30, 280], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.kernel.value", "write_shape": [30, 48, 8960], "chunk_shape": [30, 48, 8960], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.kernel.value", "write_shape": [30, 280, 1536], "chunk_shape": [30, 280, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.modulation.value", "write_shape": [30, 1, 6, 48], "chunk_shape": [30, 1, 6, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.scale.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.bias.value", "write_shape": [2], "chunk_shape": [2], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.kernel.value", "write_shape": [48, 64], "chunk_shape": [48, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.modulation.value", "write_shape": [1, 2, 48], "chunk_shape": [1, 2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.scale.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.kernel.value", "write_shape": [40, 1280], "chunk_shape": [40, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.kernel.value", "write_shape": [40, 1536], "chunk_shape": [40, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.scale.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.kernel.value", "write_shape": [1, 2, 2, 36, 48], "chunk_shape": [1, 2, 2, 36, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "player_embed.embedding.value", "write_shape": [2, 48], "chunk_shape": [2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.kernel.value", "write_shape": [8, 1536], "chunk_shape": [8, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.kernel.value", "write_shape": [48, 1536], "chunk_shape": [48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.bias.value", "write_shape": [288], "chunk_shape": [288], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.kernel.value", "write_shape": [48, 9216], "chunk_shape": [48, 9216], "ext_metadata": null}}]}
|
mp_causal_60000.pt/array_metadatas/process_4
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "blocks.action_model.img_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.img_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_attn_kv.kernel.value", "write_shape": [30, 48, 2048], "chunk_shape": [30, 48, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.kernel.value", "write_shape": [30, 23, 4], "chunk_shape": [30, 23, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.kernel.value", "write_shape": [30, 4, 128], "chunk_shape": [30, 4, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_attn_q.kernel.value", "write_shape": [30, 48, 1024], "chunk_shape": [30, 48, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.kernel.value", "write_shape": [30, 1560, 32], "chunk_shape": [30, 1560, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.kernel.value", "write_shape": [30, 32, 1024], "chunk_shape": [30, 32, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.scale.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_keyboard.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_mouse.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.t_qkv.kernel.value", "write_shape": [30, 32, 3072], "chunk_shape": [30, 32, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.bias.value", "write_shape": [30, 280], "chunk_shape": [30, 280], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.kernel.value", "write_shape": [30, 48, 8960], "chunk_shape": [30, 48, 8960], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.kernel.value", "write_shape": [30, 280, 1536], "chunk_shape": [30, 280, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.modulation.value", "write_shape": [30, 1, 6, 48], "chunk_shape": [30, 1, 6, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.scale.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.bias.value", "write_shape": [2], "chunk_shape": [2], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.kernel.value", "write_shape": [48, 64], "chunk_shape": [48, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.modulation.value", "write_shape": [1, 2, 48], "chunk_shape": [1, 2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.scale.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.kernel.value", "write_shape": [40, 1280], "chunk_shape": [40, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.kernel.value", "write_shape": [40, 1536], "chunk_shape": [40, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.scale.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.kernel.value", "write_shape": [1, 2, 2, 36, 48], "chunk_shape": [1, 2, 2, 36, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "player_embed.embedding.value", "write_shape": [2, 48], "chunk_shape": [2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.kernel.value", "write_shape": [8, 1536], "chunk_shape": [8, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.kernel.value", "write_shape": [48, 1536], "chunk_shape": [48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.bias.value", "write_shape": [288], "chunk_shape": [288], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.kernel.value", "write_shape": [48, 9216], "chunk_shape": [48, 9216], "ext_metadata": null}}]}
|
mp_causal_60000.pt/array_metadatas/process_5
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "blocks.action_model.img_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.img_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_attn_kv.kernel.value", "write_shape": [30, 48, 2048], "chunk_shape": [30, 48, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.kernel.value", "write_shape": [30, 23, 4], "chunk_shape": [30, 23, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.kernel.value", "write_shape": [30, 4, 128], "chunk_shape": [30, 4, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_attn_q.kernel.value", "write_shape": [30, 48, 1024], "chunk_shape": [30, 48, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.kernel.value", "write_shape": [30, 1560, 32], "chunk_shape": [30, 1560, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.kernel.value", "write_shape": [30, 32, 1024], "chunk_shape": [30, 32, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.scale.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_keyboard.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_mouse.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.t_qkv.kernel.value", "write_shape": [30, 32, 3072], "chunk_shape": [30, 32, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.bias.value", "write_shape": [30, 280], "chunk_shape": [30, 280], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.kernel.value", "write_shape": [30, 48, 8960], "chunk_shape": [30, 48, 8960], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.kernel.value", "write_shape": [30, 280, 1536], "chunk_shape": [30, 280, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.modulation.value", "write_shape": [30, 1, 6, 48], "chunk_shape": [30, 1, 6, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.scale.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.bias.value", "write_shape": [2], "chunk_shape": [2], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.kernel.value", "write_shape": [48, 64], "chunk_shape": [48, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.modulation.value", "write_shape": [1, 2, 48], "chunk_shape": [1, 2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.scale.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.kernel.value", "write_shape": [40, 1280], "chunk_shape": [40, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.kernel.value", "write_shape": [40, 1536], "chunk_shape": [40, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.scale.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.kernel.value", "write_shape": [1, 2, 2, 36, 48], "chunk_shape": [1, 2, 2, 36, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "player_embed.embedding.value", "write_shape": [2, 48], "chunk_shape": [2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.kernel.value", "write_shape": [8, 1536], "chunk_shape": [8, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.kernel.value", "write_shape": [48, 1536], "chunk_shape": [48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.bias.value", "write_shape": [288], "chunk_shape": [288], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.kernel.value", "write_shape": [48, 9216], "chunk_shape": [48, 9216], "ext_metadata": null}}]}
|
mp_causal_60000.pt/array_metadatas/process_6
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "blocks.action_model.img_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.img_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_attn_kv.kernel.value", "write_shape": [30, 48, 2048], "chunk_shape": [30, 48, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.kernel.value", "write_shape": [30, 23, 4], "chunk_shape": [30, 23, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.kernel.value", "write_shape": [30, 4, 128], "chunk_shape": [30, 4, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_attn_q.kernel.value", "write_shape": [30, 48, 1024], "chunk_shape": [30, 48, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.kernel.value", "write_shape": [30, 1560, 32], "chunk_shape": [30, 1560, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.kernel.value", "write_shape": [30, 32, 1024], "chunk_shape": [30, 32, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.scale.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_keyboard.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_mouse.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.t_qkv.kernel.value", "write_shape": [30, 32, 3072], "chunk_shape": [30, 32, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.bias.value", "write_shape": [30, 280], "chunk_shape": [30, 280], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.kernel.value", "write_shape": [30, 48, 8960], "chunk_shape": [30, 48, 8960], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.kernel.value", "write_shape": [30, 280, 1536], "chunk_shape": [30, 280, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.modulation.value", "write_shape": [30, 1, 6, 48], "chunk_shape": [30, 1, 6, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.scale.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.bias.value", "write_shape": [2], "chunk_shape": [2], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.kernel.value", "write_shape": [48, 64], "chunk_shape": [48, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.modulation.value", "write_shape": [1, 2, 48], "chunk_shape": [1, 2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.scale.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.kernel.value", "write_shape": [40, 1280], "chunk_shape": [40, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.kernel.value", "write_shape": [40, 1536], "chunk_shape": [40, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.scale.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.kernel.value", "write_shape": [1, 2, 2, 36, 48], "chunk_shape": [1, 2, 2, 36, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "player_embed.embedding.value", "write_shape": [2, 48], "chunk_shape": [2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.kernel.value", "write_shape": [8, 1536], "chunk_shape": [8, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.kernel.value", "write_shape": [48, 1536], "chunk_shape": [48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.bias.value", "write_shape": [288], "chunk_shape": [288], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.kernel.value", "write_shape": [48, 9216], "chunk_shape": [48, 9216], "ext_metadata": null}}]}
|
mp_causal_60000.pt/array_metadatas/process_7
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "blocks.action_model.img_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.img_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_attn_kv.kernel.value", "write_shape": [30, 48, 2048], "chunk_shape": [30, 48, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.kernel.value", "write_shape": [30, 23, 4], "chunk_shape": [30, 23, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.kernel.value", "write_shape": [30, 4, 128], "chunk_shape": [30, 4, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_attn_q.kernel.value", "write_shape": [30, 48, 1024], "chunk_shape": [30, 48, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.kernel.value", "write_shape": [30, 1560, 32], "chunk_shape": [30, 1560, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.kernel.value", "write_shape": [30, 32, 1024], "chunk_shape": [30, 32, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.scale.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_keyboard.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_mouse.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.t_qkv.kernel.value", "write_shape": [30, 32, 3072], "chunk_shape": [30, 32, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.bias.value", "write_shape": [30, 280], "chunk_shape": [30, 280], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.kernel.value", "write_shape": [30, 48, 8960], "chunk_shape": [30, 48, 8960], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.kernel.value", "write_shape": [30, 280, 1536], "chunk_shape": [30, 280, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.modulation.value", "write_shape": [30, 1, 6, 48], "chunk_shape": [30, 1, 6, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.scale.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.bias.value", "write_shape": [2], "chunk_shape": [2], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.kernel.value", "write_shape": [48, 64], "chunk_shape": [48, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.modulation.value", "write_shape": [1, 2, 48], "chunk_shape": [1, 2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.scale.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.kernel.value", "write_shape": [40, 1280], "chunk_shape": [40, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.kernel.value", "write_shape": [40, 1536], "chunk_shape": [40, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.scale.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.kernel.value", "write_shape": [1, 2, 2, 36, 48], "chunk_shape": [1, 2, 2, 36, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "player_embed.embedding.value", "write_shape": [2, 48], "chunk_shape": [2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.kernel.value", "write_shape": [8, 1536], "chunk_shape": [8, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.kernel.value", "write_shape": [48, 1536], "chunk_shape": [48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.bias.value", "write_shape": [288], "chunk_shape": [288], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.kernel.value", "write_shape": [48, 9216], "chunk_shape": [48, 9216], "ext_metadata": null}}]}
|
mp_causal_60000.pt/commit_success.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
Checkpoint commit was successful to gs://solaris-east5/solaris/model/pretrained/v2_flagship_fix_bidirectional_causal_60000.pt
|
mp_causal_60000.pt/d/009656ae062ac3299a9aa0f0d609e4aa
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:02d7447bad0c18a6d568011b800856902299d811f80b0de990e4e50b9c7f61e9
|
| 3 |
+
size 116307
|
mp_causal_60000.pt/manifest.ocdbt
ADDED
|
Binary file (120 Bytes). View file
|
|
|
mp_causal_60000.pt/ocdbt.process_0/d/3695460b7707a19f8f8eecb85bd97ab2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ac8e7966d275fb5f0f9c972b52326c8061c4c773ff724b7c5e6d0c3d4fd6b521
|
| 3 |
+
size 212370278
|
mp_causal_60000.pt/ocdbt.process_0/d/417a017d285ccaa9531f43c034552e58
ADDED
|
Binary file (277 Bytes). View file
|
|
|
mp_causal_60000.pt/ocdbt.process_0/d/5abdbd3f4919e95295173e494a934cbb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:efcb6a27950449d68b2b02d988f81e0f2da836254982288a35cee56c600b9ff5
|
| 3 |
+
size 513400016
|
mp_causal_60000.pt/ocdbt.process_0/d/ab13a2e3a9a8f7101f3308d66a9d8952
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:574b86c86413a2c03345d0b5c00615861979d5d7f6ef61078325386c2b48a972
|
| 3 |
+
size 23301988
|
mp_causal_60000.pt/ocdbt.process_0/manifest.ocdbt
ADDED
|
Binary file (264 Bytes). View file
|
|
|
mp_causal_60000.pt/ocdbt.process_1/d/49765cb511d5a29ed37a4f1fef7718e6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ac8b7e827037d901c28d3b9f5ded953bb6b265a9df39eb658c1b0bdb45238725
|
| 3 |
+
size 382263820
|
mp_causal_60000.pt/ocdbt.process_1/d/525417d8de2264a1cc2ceb60acb26ec5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:11baf290a2b0648ca71a4dded38a428bb9a1ed7d92f47f4badef2df7ef0d5f05
|
| 3 |
+
size 366856718
|
mp_causal_60000.pt/ocdbt.process_1/manifest.ocdbt
ADDED
|
Binary file (184 Bytes). View file
|
|
|
mp_causal_60000.pt/ocdbt.process_2/d/0be520c321a634b0ca6f4fe6bce8e891
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2b8dc489b4cc9d206a533591bc01e88b2e2b55856f0515eef3320bb31be0915e
|
| 3 |
+
size 382256745
|
mp_causal_60000.pt/ocdbt.process_2/d/225c40b0464162d4d3665808d735893d
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:04929c8c58f69a214a0a15fa4b92e11d87807f8315fbc71e478209ed30174e39
|
| 3 |
+
size 366847454
|
mp_causal_60000.pt/ocdbt.process_2/manifest.ocdbt
ADDED
|
Binary file (184 Bytes). View file
|
|
|
mp_causal_60000.pt/ocdbt.process_3/d/21c873b9a7006fb3b7b2a3345f2007dd
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dba9d56ccbb1971fe25108855e78fdeec0984bc20345d629d5f61d8e6561224a
|
| 3 |
+
size 334453584
|
mp_causal_60000.pt/ocdbt.process_3/d/5fab00d2588cd26a1ec3265788f45294
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:99c1f6ac05b6cdb314aa4daf01469958605cd266444b8850328c65c3e906a0b2
|
| 3 |
+
size 414659137
|
mp_causal_60000.pt/ocdbt.process_3/manifest.ocdbt
ADDED
|
Binary file (184 Bytes). View file
|
|
|
mp_causal_60000.pt/ocdbt.process_4/d/04bc0911120bfcb6658465a2768bb823
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5078f52bebf0ddd82eb72b7cd34dd0a8ebb2eb446661a6aa4f7412598b6e0b87
|
| 3 |
+
size 366859743
|
mp_causal_60000.pt/ocdbt.process_4/d/160e82bbbfe8c7eb03559a914b57807f
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:034b691dc67e519516398b88bde467508b610e4e09cfc20f2bc05e15f500fdbe
|
| 3 |
+
size 382290852
|
mp_causal_60000.pt/ocdbt.process_4/manifest.ocdbt
ADDED
|
Binary file (184 Bytes). View file
|
|
|
mp_causal_60000.pt/ocdbt.process_5/d/0105ce032e58c01b1a87722da49cf075
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0b090da15b3744119ad4842c0acf3133f1b753f42e103dbce925c23a43074457
|
| 3 |
+
size 184492463
|
mp_causal_60000.pt/ocdbt.process_5/d/0d767211e01bd5107223d6ebb4b55e55
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e8c24e1e864f25f99d6bd23f2ef6039f949e3914ff5b3614934e9db3810dda5a
|
| 3 |
+
size 564591736
|
mp_causal_60000.pt/ocdbt.process_5/manifest.ocdbt
ADDED
|
Binary file (181 Bytes). View file
|
|
|
mp_causal_60000.pt/ocdbt.process_6/d/322c3f14eefdd0d22a2b21107075a20e
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d2a5206db4af5163487b58ff356ba71fcee74423f96c03df361c8bdc472eacc2
|
| 3 |
+
size 366836963
|
mp_causal_60000.pt/ocdbt.process_6/d/c372ea76909d79ee62ec3a482a4b6865
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0b079c2d391beb29c30dcec6da3bfc221bdeeb9bcc0e97ef50da239b98f538b5
|
| 3 |
+
size 382266111
|
mp_causal_60000.pt/ocdbt.process_6/manifest.ocdbt
ADDED
|
Binary file (184 Bytes). View file
|
|
|
mp_causal_60000.pt/ocdbt.process_7/d/5bc6c9d3af5b0900c8806766c6192a53
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed723a34d48a98a8797402a11324bb9acc9371f08cb16cc4574e0cf0ed11fd05
|
| 3 |
+
size 325895593
|
mp_causal_60000.pt/ocdbt.process_7/d/5e7e04aee528841d2f1b0d91d946db66
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:414f983eb2fb9808d89e9d87668a3569524efc4b2c024809380d792bf954d210
|
| 3 |
+
size 423201869
|
mp_causal_60000.pt/ocdbt.process_7/manifest.ocdbt
ADDED
|
Binary file (183 Bytes). View file
|
|
|