Anonymous-Submission-830af commited on
Commit
b542727
·
verified ·
1 Parent(s): 0e82bb4

Upload folder using huggingface_hub

Browse files
Files changed (41) hide show
  1. .gitattributes +18 -0
  2. mp_causal_60000.pt/_CHECKPOINT_METADATA +1 -0
  3. mp_causal_60000.pt/_METADATA +1 -0
  4. mp_causal_60000.pt/_sharding +1 -0
  5. mp_causal_60000.pt/array_metadatas/process_0 +1 -0
  6. mp_causal_60000.pt/array_metadatas/process_1 +1 -0
  7. mp_causal_60000.pt/array_metadatas/process_2 +1 -0
  8. mp_causal_60000.pt/array_metadatas/process_3 +1 -0
  9. mp_causal_60000.pt/array_metadatas/process_4 +1 -0
  10. mp_causal_60000.pt/array_metadatas/process_5 +1 -0
  11. mp_causal_60000.pt/array_metadatas/process_6 +1 -0
  12. mp_causal_60000.pt/array_metadatas/process_7 +1 -0
  13. mp_causal_60000.pt/commit_success.txt +1 -0
  14. mp_causal_60000.pt/d/009656ae062ac3299a9aa0f0d609e4aa +3 -0
  15. mp_causal_60000.pt/manifest.ocdbt +0 -0
  16. mp_causal_60000.pt/ocdbt.process_0/d/3695460b7707a19f8f8eecb85bd97ab2 +3 -0
  17. mp_causal_60000.pt/ocdbt.process_0/d/417a017d285ccaa9531f43c034552e58 +0 -0
  18. mp_causal_60000.pt/ocdbt.process_0/d/5abdbd3f4919e95295173e494a934cbb +3 -0
  19. mp_causal_60000.pt/ocdbt.process_0/d/ab13a2e3a9a8f7101f3308d66a9d8952 +3 -0
  20. mp_causal_60000.pt/ocdbt.process_0/manifest.ocdbt +0 -0
  21. mp_causal_60000.pt/ocdbt.process_1/d/49765cb511d5a29ed37a4f1fef7718e6 +3 -0
  22. mp_causal_60000.pt/ocdbt.process_1/d/525417d8de2264a1cc2ceb60acb26ec5 +3 -0
  23. mp_causal_60000.pt/ocdbt.process_1/manifest.ocdbt +0 -0
  24. mp_causal_60000.pt/ocdbt.process_2/d/0be520c321a634b0ca6f4fe6bce8e891 +3 -0
  25. mp_causal_60000.pt/ocdbt.process_2/d/225c40b0464162d4d3665808d735893d +3 -0
  26. mp_causal_60000.pt/ocdbt.process_2/manifest.ocdbt +0 -0
  27. mp_causal_60000.pt/ocdbt.process_3/d/21c873b9a7006fb3b7b2a3345f2007dd +3 -0
  28. mp_causal_60000.pt/ocdbt.process_3/d/5fab00d2588cd26a1ec3265788f45294 +3 -0
  29. mp_causal_60000.pt/ocdbt.process_3/manifest.ocdbt +0 -0
  30. mp_causal_60000.pt/ocdbt.process_4/d/04bc0911120bfcb6658465a2768bb823 +3 -0
  31. mp_causal_60000.pt/ocdbt.process_4/d/160e82bbbfe8c7eb03559a914b57807f +3 -0
  32. mp_causal_60000.pt/ocdbt.process_4/manifest.ocdbt +0 -0
  33. mp_causal_60000.pt/ocdbt.process_5/d/0105ce032e58c01b1a87722da49cf075 +3 -0
  34. mp_causal_60000.pt/ocdbt.process_5/d/0d767211e01bd5107223d6ebb4b55e55 +3 -0
  35. mp_causal_60000.pt/ocdbt.process_5/manifest.ocdbt +0 -0
  36. mp_causal_60000.pt/ocdbt.process_6/d/322c3f14eefdd0d22a2b21107075a20e +3 -0
  37. mp_causal_60000.pt/ocdbt.process_6/d/c372ea76909d79ee62ec3a482a4b6865 +3 -0
  38. mp_causal_60000.pt/ocdbt.process_6/manifest.ocdbt +0 -0
  39. mp_causal_60000.pt/ocdbt.process_7/d/5bc6c9d3af5b0900c8806766c6192a53 +3 -0
  40. mp_causal_60000.pt/ocdbt.process_7/d/5e7e04aee528841d2f1b0d91d946db66 +3 -0
  41. mp_causal_60000.pt/ocdbt.process_7/manifest.ocdbt +0 -0
.gitattributes CHANGED
@@ -87,3 +87,21 @@ mp_bidirectional_120000.pt/ocdbt.process_6/d/974d2ea3375d4afae154bf234e6d932d fi
87
  mp_bidirectional_120000.pt/ocdbt.process_6/d/b977bce3e08f2761fa4cc115ac6bb22f filter=lfs diff=lfs merge=lfs -text
88
  mp_bidirectional_120000.pt/ocdbt.process_7/d/62ad7ede1673afd5972b964e1ffa65d3 filter=lfs diff=lfs merge=lfs -text
89
  mp_bidirectional_120000.pt/ocdbt.process_7/d/73d0a8ede0b8f4532bc44da8b166a2eb filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
87
  mp_bidirectional_120000.pt/ocdbt.process_6/d/b977bce3e08f2761fa4cc115ac6bb22f filter=lfs diff=lfs merge=lfs -text
88
  mp_bidirectional_120000.pt/ocdbt.process_7/d/62ad7ede1673afd5972b964e1ffa65d3 filter=lfs diff=lfs merge=lfs -text
89
  mp_bidirectional_120000.pt/ocdbt.process_7/d/73d0a8ede0b8f4532bc44da8b166a2eb filter=lfs diff=lfs merge=lfs -text
90
+ mp_causal_60000.pt/d/009656ae062ac3299a9aa0f0d609e4aa filter=lfs diff=lfs merge=lfs -text
91
+ mp_causal_60000.pt/ocdbt.process_0/d/3695460b7707a19f8f8eecb85bd97ab2 filter=lfs diff=lfs merge=lfs -text
92
+ mp_causal_60000.pt/ocdbt.process_0/d/5abdbd3f4919e95295173e494a934cbb filter=lfs diff=lfs merge=lfs -text
93
+ mp_causal_60000.pt/ocdbt.process_0/d/ab13a2e3a9a8f7101f3308d66a9d8952 filter=lfs diff=lfs merge=lfs -text
94
+ mp_causal_60000.pt/ocdbt.process_1/d/49765cb511d5a29ed37a4f1fef7718e6 filter=lfs diff=lfs merge=lfs -text
95
+ mp_causal_60000.pt/ocdbt.process_1/d/525417d8de2264a1cc2ceb60acb26ec5 filter=lfs diff=lfs merge=lfs -text
96
+ mp_causal_60000.pt/ocdbt.process_2/d/0be520c321a634b0ca6f4fe6bce8e891 filter=lfs diff=lfs merge=lfs -text
97
+ mp_causal_60000.pt/ocdbt.process_2/d/225c40b0464162d4d3665808d735893d filter=lfs diff=lfs merge=lfs -text
98
+ mp_causal_60000.pt/ocdbt.process_3/d/21c873b9a7006fb3b7b2a3345f2007dd filter=lfs diff=lfs merge=lfs -text
99
+ mp_causal_60000.pt/ocdbt.process_3/d/5fab00d2588cd26a1ec3265788f45294 filter=lfs diff=lfs merge=lfs -text
100
+ mp_causal_60000.pt/ocdbt.process_4/d/04bc0911120bfcb6658465a2768bb823 filter=lfs diff=lfs merge=lfs -text
101
+ mp_causal_60000.pt/ocdbt.process_4/d/160e82bbbfe8c7eb03559a914b57807f filter=lfs diff=lfs merge=lfs -text
102
+ mp_causal_60000.pt/ocdbt.process_5/d/0105ce032e58c01b1a87722da49cf075 filter=lfs diff=lfs merge=lfs -text
103
+ mp_causal_60000.pt/ocdbt.process_5/d/0d767211e01bd5107223d6ebb4b55e55 filter=lfs diff=lfs merge=lfs -text
104
+ mp_causal_60000.pt/ocdbt.process_6/d/322c3f14eefdd0d22a2b21107075a20e filter=lfs diff=lfs merge=lfs -text
105
+ mp_causal_60000.pt/ocdbt.process_6/d/c372ea76909d79ee62ec3a482a4b6865 filter=lfs diff=lfs merge=lfs -text
106
+ mp_causal_60000.pt/ocdbt.process_7/d/5bc6c9d3af5b0900c8806766c6192a53 filter=lfs diff=lfs merge=lfs -text
107
+ mp_causal_60000.pt/ocdbt.process_7/d/5e7e04aee528841d2f1b0d91d946db66 filter=lfs diff=lfs merge=lfs -text
mp_causal_60000.pt/_CHECKPOINT_METADATA ADDED
@@ -0,0 +1 @@
 
 
1
+ {"item_handlers": "orbax.checkpoint._src.handlers.standard_checkpoint_handler.StandardCheckpointHandler", "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1768927118604876117, "commit_timestamp_nsecs": 1768927136561342347, "custom_metadata": {}}
mp_causal_60000.pt/_METADATA ADDED
@@ -0,0 +1 @@
 
 
1
+ {"tree_metadata": {"('blocks', 'action_model', 'img_attn_k_norm', 'weight', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "img_attn_k_norm", "key_type": 2}, {"key": "weight", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 2]}}, "('blocks', 'action_model', 'img_attn_q_norm', 'weight', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "img_attn_q_norm", "key_type": 2}, {"key": "weight", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 2]}}, "('blocks', 'action_model', 'key_attn_k_norm', 'weight', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "key_attn_k_norm", "key_type": 2}, {"key": "weight", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 2]}}, "('blocks', 'action_model', 'key_attn_q_norm', 'weight', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "key_attn_q_norm", "key_type": 2}, {"key": "weight", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 2]}}, "('blocks', 'action_model', 'keyboard_attn_kv', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "keyboard_attn_kv", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 2048]}}, "('blocks', 'action_model', 'keyboard_embed', 'layers', '0', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "keyboard_embed", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 4]}}, "('blocks', 'action_model', 'keyboard_embed', 'layers', '0', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "keyboard_embed", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 23, 4]}}, "('blocks', 'action_model', 'keyboard_embed', 'layers', '2', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "keyboard_embed", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 4]}}, "('blocks', 'action_model', 'keyboard_embed', 'layers', '2', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "keyboard_embed", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 4, 128]}}, "('blocks', 'action_model', 'mouse_attn_q', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "mouse_attn_q", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1024]}}, "('blocks', 'action_model', 'mouse_mlp', 'layers', '0', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "mouse_mlp", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 32]}}, "('blocks', 'action_model', 'mouse_mlp', 'layers', '0', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "mouse_mlp", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 1560, 32]}}, "('blocks', 'action_model', 'mouse_mlp', 'layers', '2', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "mouse_mlp", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 32]}}, "('blocks', 'action_model', 'mouse_mlp', 'layers', '2', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "mouse_mlp", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 32, 1024]}}, "('blocks', 'action_model', 'mouse_mlp', 'layers', '3', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "mouse_mlp", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "3", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 32]}}, "('blocks', 'action_model', 'mouse_mlp', 'layers', '3', 'scale', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "mouse_mlp", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "3", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 32]}}, "('blocks', 'action_model', 'proj_keyboard', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "proj_keyboard", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 32, 1536]}}, "('blocks', 'action_model', 'proj_mouse', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "proj_mouse", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 32, 1536]}}, "('blocks', 'action_model', 't_qkv', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "action_model", "key_type": 2}, {"key": "t_qkv", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 32, 3072]}}, "('blocks', 'cross_attn', 'k', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'cross_attn', 'k', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1536]}}, "('blocks', 'cross_attn', 'norm_k', 'weight', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "norm_k", "key_type": 2}, {"key": "weight", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'cross_attn', 'norm_q', 'weight', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "norm_q", "key_type": 2}, {"key": "weight", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'cross_attn', 'o', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'cross_attn', 'o', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1536]}}, "('blocks', 'cross_attn', 'q', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'cross_attn', 'q', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1536]}}, "('blocks', 'cross_attn', 'v', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'cross_attn', 'v', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "cross_attn", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1536]}}, "('blocks', 'ffn', 'layers', '0', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "ffn", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 280]}}, "('blocks', 'ffn', 'layers', '0', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "ffn", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 8960]}}, "('blocks', 'ffn', 'layers', '2', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "ffn", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'ffn', 'layers', '2', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "ffn", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 280, 1536]}}, "('blocks', 'modulation', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "modulation", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 1, 6, 48]}}, "('blocks', 'norm3', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "norm3", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'norm3', 'scale', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "norm3", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'self_attn', 'k', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'self_attn', 'k', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1536]}}, "('blocks', 'self_attn', 'norm_k', 'weight', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "norm_k", "key_type": 2}, {"key": "weight", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'self_attn', 'norm_q', 'weight', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "norm_q", "key_type": 2}, {"key": "weight", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'self_attn', 'o', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'self_attn', 'o', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1536]}}, "('blocks', 'self_attn', 'q', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'self_attn', 'q', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1536]}}, "('blocks', 'self_attn', 'v', 'bias', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48]}}, "('blocks', 'self_attn', 'v', 'kernel', 'value')": {"key_metadata": [{"key": "blocks", "key_type": 2}, {"key": "self_attn", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [30, 48, 1536]}}, "('head', 'head', 'bias', 'value')": {"key_metadata": [{"key": "head", "key_type": 2}, {"key": "head", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [2]}}, "('head', 'head', 'kernel', 'value')": {"key_metadata": [{"key": "head", "key_type": 2}, {"key": "head", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48, 64]}}, "('head', 'modulation', 'value')": {"key_metadata": [{"key": "head", "key_type": 2}, {"key": "modulation", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [1, 2, 48]}}, "('img_emb', 'proj', '0', 'bias', 'value')": {"key_metadata": [{"key": "img_emb", "key_type": 2}, {"key": "proj", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [40]}}, "('img_emb', 'proj', '0', 'scale', 'value')": {"key_metadata": [{"key": "img_emb", "key_type": 2}, {"key": "proj", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [40]}}, "('img_emb', 'proj', '1', 'bias', 'value')": {"key_metadata": [{"key": "img_emb", "key_type": 2}, {"key": "proj", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [40]}}, "('img_emb', 'proj', '1', 'kernel', 'value')": {"key_metadata": [{"key": "img_emb", "key_type": 2}, {"key": "proj", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [40, 1280]}}, "('img_emb', 'proj', '2', 'bias', 'value')": {"key_metadata": [{"key": "img_emb", "key_type": 2}, {"key": "proj", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48]}}, "('img_emb', 'proj', '2', 'kernel', 'value')": {"key_metadata": [{"key": "img_emb", "key_type": 2}, {"key": "proj", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [40, 1536]}}, "('img_emb', 'proj', '3', 'bias', 'value')": {"key_metadata": [{"key": "img_emb", "key_type": 2}, {"key": "proj", "key_type": 2}, {"key": "3", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48]}}, "('img_emb', 'proj', '3', 'scale', 'value')": {"key_metadata": [{"key": "img_emb", "key_type": 2}, {"key": "proj", "key_type": 2}, {"key": "3", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48]}}, "('patch_embedding', 'bias', 'value')": {"key_metadata": [{"key": "patch_embedding", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48]}}, "('patch_embedding', 'kernel', 'value')": {"key_metadata": [{"key": "patch_embedding", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [1, 2, 2, 36, 48]}}, "('player_embed', 'embedding', 'value')": {"key_metadata": [{"key": "player_embed", "key_type": 2}, {"key": "embedding", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [2, 48]}}, "('time_embedding', 'layers', '0', 'bias', 'value')": {"key_metadata": [{"key": "time_embedding", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48]}}, "('time_embedding', 'layers', '0', 'kernel', 'value')": {"key_metadata": [{"key": "time_embedding", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [8, 1536]}}, "('time_embedding', 'layers', '2', 'bias', 'value')": {"key_metadata": [{"key": "time_embedding", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48]}}, "('time_embedding', 'layers', '2', 'kernel', 'value')": {"key_metadata": [{"key": "time_embedding", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48, 1536]}}, "('time_projection', 'layers', '1', 'bias', 'value')": {"key_metadata": [{"key": "time_projection", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [288]}}, "('time_projection', 'layers', '1', 'kernel', 'value')": {"key_metadata": [{"key": "time_projection", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [48, 9216]}}}, "use_zarr3": false, "store_array_data_equal_to_fill_value": true, "custom_metadata": null}
mp_causal_60000.pt/_sharding ADDED
@@ -0,0 +1 @@
 
 
1
+ {"YmxvY2tzLm1vZHVsYXRpb24udmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLm5vcm0zLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLm5vcm0zLnNjYWxlLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC50X3Frdi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5pbWdfYXR0bl9rX25vcm0ud2VpZ2h0LnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5pbWdfYXR0bl9xX25vcm0ud2VpZ2h0LnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5rZXlfYXR0bl9rX25vcm0ud2VpZ2h0LnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5rZXlfYXR0bl9xX25vcm0ud2VpZ2h0LnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5rZXlib2FyZF9hdHRuX2t2Lmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5rZXlib2FyZF9lbWJlZC5sYXllcnMuMC5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5rZXlib2FyZF9lbWJlZC5sYXllcnMuMC5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5rZXlib2FyZF9lbWJlZC5sYXllcnMuMi5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5rZXlib2FyZF9lbWJlZC5sYXllcnMuMi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5tb3VzZV9hdHRuX3Eua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5tb3VzZV9tbHAubGF5ZXJzLjAuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5tb3VzZV9tbHAubGF5ZXJzLjAua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5tb3VzZV9tbHAubGF5ZXJzLjIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5tb3VzZV9tbHAubGF5ZXJzLjIua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5tb3VzZV9tbHAubGF5ZXJzLjMuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5tb3VzZV9tbHAubGF5ZXJzLjMuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5wcm9qX21vdXNlLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmFjdGlvbl9tb2RlbC5wcm9qX2tleWJvYXJkLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4uay5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4uay5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4ubm9ybV9rLndlaWdodC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4ubm9ybV9xLndlaWdodC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4uby5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4uby5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4ucS5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4ucS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4udi5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmNyb3NzX2F0dG4udi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmZmbi5sYXllcnMuMC5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmZmbi5sYXllcnMuMC5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, \"data\", null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmZmbi5sYXllcnMuMi5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLmZmbi5sYXllcnMuMi5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi52LmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi52Lmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi5rLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi5rLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi5ub3JtX2sud2VpZ2h0LnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi5ub3JtX3Eud2VpZ2h0LnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi5vLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi5vLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi5xLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","YmxvY2tzLnNlbGZfYXR0bi5xLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aGVhZC5oZWFkLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aGVhZC5oZWFkLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aGVhZC5tb2R1bGF0aW9uLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aW1nX2VtYi5wcm9qLjAuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aW1nX2VtYi5wcm9qLjAuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aW1nX2VtYi5wcm9qLjEuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aW1nX2VtYi5wcm9qLjEua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aW1nX2VtYi5wcm9qLjIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aW1nX2VtYi5wcm9qLjIua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aW1nX2VtYi5wcm9qLjMuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","aW1nX2VtYi5wcm9qLjMuc2NhbGUudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","cGF0Y2hfZW1iZWRkaW5nLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","cGF0Y2hfZW1iZWRkaW5nLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null, null, null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","cGxheWVyX2VtYmVkLmVtYmVkZGluZy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","dGltZV9lbWJlZGRpbmcubGF5ZXJzLjAuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","dGltZV9lbWJlZGRpbmcubGF5ZXJzLjAua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","dGltZV9lbWJlZGRpbmcubGF5ZXJzLjIuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","dGltZV9lbWJlZGRpbmcubGF5ZXJzLjIua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","dGltZV9wcm9qZWN0aW9uLmxheWVycy4xLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}","dGltZV9wcm9qZWN0aW9uLmxheWVycy4xLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [32], \"axis_names\": [\"data\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [{\"id\": 0}, {\"id\": 8}, {\"id\": 16}, {\"id\": 24}, {\"id\": 2}, {\"id\": 10}, {\"id\": 18}, {\"id\": 26}, {\"id\": 4}, {\"id\": 12}, {\"id\": 20}, {\"id\": 28}, {\"id\": 6}, {\"id\": 14}, {\"id\": 22}, {\"id\": 30}, {\"id\": 1}, {\"id\": 9}, {\"id\": 17}, {\"id\": 25}, {\"id\": 3}, {\"id\": 11}, {\"id\": 19}, {\"id\": 27}, {\"id\": 5}, {\"id\": 13}, {\"id\": 21}, {\"id\": 29}, {\"id\": 7}, {\"id\": 15}, {\"id\": 23}, {\"id\": 31}]}}"}
mp_causal_60000.pt/array_metadatas/process_0 ADDED
@@ -0,0 +1 @@
 
 
1
+ {"array_metadatas": [{"array_metadata": {"param_name": "blocks.action_model.img_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.img_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_attn_kv.kernel.value", "write_shape": [30, 48, 2048], "chunk_shape": [30, 48, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.kernel.value", "write_shape": [30, 23, 4], "chunk_shape": [30, 23, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.kernel.value", "write_shape": [30, 4, 128], "chunk_shape": [30, 4, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_attn_q.kernel.value", "write_shape": [30, 48, 1024], "chunk_shape": [30, 48, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.kernel.value", "write_shape": [30, 1560, 32], "chunk_shape": [30, 1560, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.kernel.value", "write_shape": [30, 32, 1024], "chunk_shape": [30, 32, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.scale.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_keyboard.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_mouse.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.t_qkv.kernel.value", "write_shape": [30, 32, 3072], "chunk_shape": [30, 32, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.bias.value", "write_shape": [30, 280], "chunk_shape": [30, 280], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.kernel.value", "write_shape": [30, 48, 8960], "chunk_shape": [30, 48, 8960], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.kernel.value", "write_shape": [30, 280, 1536], "chunk_shape": [30, 280, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.modulation.value", "write_shape": [30, 1, 6, 48], "chunk_shape": [30, 1, 6, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.scale.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.bias.value", "write_shape": [2], "chunk_shape": [2], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.kernel.value", "write_shape": [48, 64], "chunk_shape": [48, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.modulation.value", "write_shape": [1, 2, 48], "chunk_shape": [1, 2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.scale.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.kernel.value", "write_shape": [40, 1280], "chunk_shape": [40, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.kernel.value", "write_shape": [40, 1536], "chunk_shape": [40, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.scale.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.kernel.value", "write_shape": [1, 2, 2, 36, 48], "chunk_shape": [1, 2, 2, 36, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "player_embed.embedding.value", "write_shape": [2, 48], "chunk_shape": [2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.kernel.value", "write_shape": [8, 1536], "chunk_shape": [8, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.kernel.value", "write_shape": [48, 1536], "chunk_shape": [48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.bias.value", "write_shape": [288], "chunk_shape": [288], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.kernel.value", "write_shape": [48, 9216], "chunk_shape": [48, 9216], "ext_metadata": null}}]}
mp_causal_60000.pt/array_metadatas/process_1 ADDED
@@ -0,0 +1 @@
 
 
1
+ {"array_metadatas": [{"array_metadata": {"param_name": "blocks.action_model.img_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.img_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_attn_kv.kernel.value", "write_shape": [30, 48, 2048], "chunk_shape": [30, 48, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.kernel.value", "write_shape": [30, 23, 4], "chunk_shape": [30, 23, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.kernel.value", "write_shape": [30, 4, 128], "chunk_shape": [30, 4, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_attn_q.kernel.value", "write_shape": [30, 48, 1024], "chunk_shape": [30, 48, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.kernel.value", "write_shape": [30, 1560, 32], "chunk_shape": [30, 1560, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.kernel.value", "write_shape": [30, 32, 1024], "chunk_shape": [30, 32, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.scale.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_keyboard.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_mouse.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.t_qkv.kernel.value", "write_shape": [30, 32, 3072], "chunk_shape": [30, 32, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.bias.value", "write_shape": [30, 280], "chunk_shape": [30, 280], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.kernel.value", "write_shape": [30, 48, 8960], "chunk_shape": [30, 48, 8960], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.kernel.value", "write_shape": [30, 280, 1536], "chunk_shape": [30, 280, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.modulation.value", "write_shape": [30, 1, 6, 48], "chunk_shape": [30, 1, 6, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.scale.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.bias.value", "write_shape": [2], "chunk_shape": [2], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.kernel.value", "write_shape": [48, 64], "chunk_shape": [48, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.modulation.value", "write_shape": [1, 2, 48], "chunk_shape": [1, 2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.scale.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.kernel.value", "write_shape": [40, 1280], "chunk_shape": [40, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.kernel.value", "write_shape": [40, 1536], "chunk_shape": [40, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.scale.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.kernel.value", "write_shape": [1, 2, 2, 36, 48], "chunk_shape": [1, 2, 2, 36, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "player_embed.embedding.value", "write_shape": [2, 48], "chunk_shape": [2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.kernel.value", "write_shape": [8, 1536], "chunk_shape": [8, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.kernel.value", "write_shape": [48, 1536], "chunk_shape": [48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.bias.value", "write_shape": [288], "chunk_shape": [288], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.kernel.value", "write_shape": [48, 9216], "chunk_shape": [48, 9216], "ext_metadata": null}}]}
mp_causal_60000.pt/array_metadatas/process_2 ADDED
@@ -0,0 +1 @@
 
 
1
+ {"array_metadatas": [{"array_metadata": {"param_name": "blocks.action_model.img_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.img_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_attn_kv.kernel.value", "write_shape": [30, 48, 2048], "chunk_shape": [30, 48, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.kernel.value", "write_shape": [30, 23, 4], "chunk_shape": [30, 23, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.kernel.value", "write_shape": [30, 4, 128], "chunk_shape": [30, 4, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_attn_q.kernel.value", "write_shape": [30, 48, 1024], "chunk_shape": [30, 48, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.kernel.value", "write_shape": [30, 1560, 32], "chunk_shape": [30, 1560, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.kernel.value", "write_shape": [30, 32, 1024], "chunk_shape": [30, 32, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.scale.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_keyboard.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_mouse.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.t_qkv.kernel.value", "write_shape": [30, 32, 3072], "chunk_shape": [30, 32, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.bias.value", "write_shape": [30, 280], "chunk_shape": [30, 280], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.kernel.value", "write_shape": [30, 48, 8960], "chunk_shape": [30, 48, 8960], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.kernel.value", "write_shape": [30, 280, 1536], "chunk_shape": [30, 280, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.modulation.value", "write_shape": [30, 1, 6, 48], "chunk_shape": [30, 1, 6, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.scale.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.bias.value", "write_shape": [2], "chunk_shape": [2], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.kernel.value", "write_shape": [48, 64], "chunk_shape": [48, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.modulation.value", "write_shape": [1, 2, 48], "chunk_shape": [1, 2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.scale.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.kernel.value", "write_shape": [40, 1280], "chunk_shape": [40, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.kernel.value", "write_shape": [40, 1536], "chunk_shape": [40, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.scale.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.kernel.value", "write_shape": [1, 2, 2, 36, 48], "chunk_shape": [1, 2, 2, 36, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "player_embed.embedding.value", "write_shape": [2, 48], "chunk_shape": [2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.kernel.value", "write_shape": [8, 1536], "chunk_shape": [8, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.kernel.value", "write_shape": [48, 1536], "chunk_shape": [48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.bias.value", "write_shape": [288], "chunk_shape": [288], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.kernel.value", "write_shape": [48, 9216], "chunk_shape": [48, 9216], "ext_metadata": null}}]}
mp_causal_60000.pt/array_metadatas/process_3 ADDED
@@ -0,0 +1 @@
 
 
1
+ {"array_metadatas": [{"array_metadata": {"param_name": "blocks.action_model.img_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.img_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_attn_kv.kernel.value", "write_shape": [30, 48, 2048], "chunk_shape": [30, 48, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.kernel.value", "write_shape": [30, 23, 4], "chunk_shape": [30, 23, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.kernel.value", "write_shape": [30, 4, 128], "chunk_shape": [30, 4, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_attn_q.kernel.value", "write_shape": [30, 48, 1024], "chunk_shape": [30, 48, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.kernel.value", "write_shape": [30, 1560, 32], "chunk_shape": [30, 1560, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.kernel.value", "write_shape": [30, 32, 1024], "chunk_shape": [30, 32, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.scale.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_keyboard.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_mouse.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.t_qkv.kernel.value", "write_shape": [30, 32, 3072], "chunk_shape": [30, 32, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.bias.value", "write_shape": [30, 280], "chunk_shape": [30, 280], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.kernel.value", "write_shape": [30, 48, 8960], "chunk_shape": [30, 48, 8960], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.kernel.value", "write_shape": [30, 280, 1536], "chunk_shape": [30, 280, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.modulation.value", "write_shape": [30, 1, 6, 48], "chunk_shape": [30, 1, 6, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.scale.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.bias.value", "write_shape": [2], "chunk_shape": [2], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.kernel.value", "write_shape": [48, 64], "chunk_shape": [48, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.modulation.value", "write_shape": [1, 2, 48], "chunk_shape": [1, 2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.scale.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.kernel.value", "write_shape": [40, 1280], "chunk_shape": [40, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.kernel.value", "write_shape": [40, 1536], "chunk_shape": [40, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.scale.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.kernel.value", "write_shape": [1, 2, 2, 36, 48], "chunk_shape": [1, 2, 2, 36, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "player_embed.embedding.value", "write_shape": [2, 48], "chunk_shape": [2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.kernel.value", "write_shape": [8, 1536], "chunk_shape": [8, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.kernel.value", "write_shape": [48, 1536], "chunk_shape": [48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.bias.value", "write_shape": [288], "chunk_shape": [288], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.kernel.value", "write_shape": [48, 9216], "chunk_shape": [48, 9216], "ext_metadata": null}}]}
mp_causal_60000.pt/array_metadatas/process_4 ADDED
@@ -0,0 +1 @@
 
 
1
+ {"array_metadatas": [{"array_metadata": {"param_name": "blocks.action_model.img_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.img_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_attn_kv.kernel.value", "write_shape": [30, 48, 2048], "chunk_shape": [30, 48, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.kernel.value", "write_shape": [30, 23, 4], "chunk_shape": [30, 23, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.kernel.value", "write_shape": [30, 4, 128], "chunk_shape": [30, 4, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_attn_q.kernel.value", "write_shape": [30, 48, 1024], "chunk_shape": [30, 48, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.kernel.value", "write_shape": [30, 1560, 32], "chunk_shape": [30, 1560, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.kernel.value", "write_shape": [30, 32, 1024], "chunk_shape": [30, 32, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.scale.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_keyboard.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_mouse.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.t_qkv.kernel.value", "write_shape": [30, 32, 3072], "chunk_shape": [30, 32, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.bias.value", "write_shape": [30, 280], "chunk_shape": [30, 280], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.kernel.value", "write_shape": [30, 48, 8960], "chunk_shape": [30, 48, 8960], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.kernel.value", "write_shape": [30, 280, 1536], "chunk_shape": [30, 280, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.modulation.value", "write_shape": [30, 1, 6, 48], "chunk_shape": [30, 1, 6, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.scale.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.bias.value", "write_shape": [2], "chunk_shape": [2], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.kernel.value", "write_shape": [48, 64], "chunk_shape": [48, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.modulation.value", "write_shape": [1, 2, 48], "chunk_shape": [1, 2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.scale.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.kernel.value", "write_shape": [40, 1280], "chunk_shape": [40, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.kernel.value", "write_shape": [40, 1536], "chunk_shape": [40, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.scale.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.kernel.value", "write_shape": [1, 2, 2, 36, 48], "chunk_shape": [1, 2, 2, 36, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "player_embed.embedding.value", "write_shape": [2, 48], "chunk_shape": [2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.kernel.value", "write_shape": [8, 1536], "chunk_shape": [8, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.kernel.value", "write_shape": [48, 1536], "chunk_shape": [48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.bias.value", "write_shape": [288], "chunk_shape": [288], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.kernel.value", "write_shape": [48, 9216], "chunk_shape": [48, 9216], "ext_metadata": null}}]}
mp_causal_60000.pt/array_metadatas/process_5 ADDED
@@ -0,0 +1 @@
 
 
1
+ {"array_metadatas": [{"array_metadata": {"param_name": "blocks.action_model.img_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.img_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_attn_kv.kernel.value", "write_shape": [30, 48, 2048], "chunk_shape": [30, 48, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.kernel.value", "write_shape": [30, 23, 4], "chunk_shape": [30, 23, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.kernel.value", "write_shape": [30, 4, 128], "chunk_shape": [30, 4, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_attn_q.kernel.value", "write_shape": [30, 48, 1024], "chunk_shape": [30, 48, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.kernel.value", "write_shape": [30, 1560, 32], "chunk_shape": [30, 1560, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.kernel.value", "write_shape": [30, 32, 1024], "chunk_shape": [30, 32, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.scale.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_keyboard.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_mouse.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.t_qkv.kernel.value", "write_shape": [30, 32, 3072], "chunk_shape": [30, 32, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.bias.value", "write_shape": [30, 280], "chunk_shape": [30, 280], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.kernel.value", "write_shape": [30, 48, 8960], "chunk_shape": [30, 48, 8960], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.kernel.value", "write_shape": [30, 280, 1536], "chunk_shape": [30, 280, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.modulation.value", "write_shape": [30, 1, 6, 48], "chunk_shape": [30, 1, 6, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.scale.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.bias.value", "write_shape": [2], "chunk_shape": [2], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.kernel.value", "write_shape": [48, 64], "chunk_shape": [48, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.modulation.value", "write_shape": [1, 2, 48], "chunk_shape": [1, 2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.scale.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.kernel.value", "write_shape": [40, 1280], "chunk_shape": [40, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.kernel.value", "write_shape": [40, 1536], "chunk_shape": [40, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.scale.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.kernel.value", "write_shape": [1, 2, 2, 36, 48], "chunk_shape": [1, 2, 2, 36, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "player_embed.embedding.value", "write_shape": [2, 48], "chunk_shape": [2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.kernel.value", "write_shape": [8, 1536], "chunk_shape": [8, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.kernel.value", "write_shape": [48, 1536], "chunk_shape": [48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.bias.value", "write_shape": [288], "chunk_shape": [288], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.kernel.value", "write_shape": [48, 9216], "chunk_shape": [48, 9216], "ext_metadata": null}}]}
mp_causal_60000.pt/array_metadatas/process_6 ADDED
@@ -0,0 +1 @@
 
 
1
+ {"array_metadatas": [{"array_metadata": {"param_name": "blocks.action_model.img_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.img_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_attn_kv.kernel.value", "write_shape": [30, 48, 2048], "chunk_shape": [30, 48, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.kernel.value", "write_shape": [30, 23, 4], "chunk_shape": [30, 23, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.kernel.value", "write_shape": [30, 4, 128], "chunk_shape": [30, 4, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_attn_q.kernel.value", "write_shape": [30, 48, 1024], "chunk_shape": [30, 48, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.kernel.value", "write_shape": [30, 1560, 32], "chunk_shape": [30, 1560, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.kernel.value", "write_shape": [30, 32, 1024], "chunk_shape": [30, 32, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.scale.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_keyboard.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_mouse.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.t_qkv.kernel.value", "write_shape": [30, 32, 3072], "chunk_shape": [30, 32, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.bias.value", "write_shape": [30, 280], "chunk_shape": [30, 280], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.kernel.value", "write_shape": [30, 48, 8960], "chunk_shape": [30, 48, 8960], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.kernel.value", "write_shape": [30, 280, 1536], "chunk_shape": [30, 280, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.modulation.value", "write_shape": [30, 1, 6, 48], "chunk_shape": [30, 1, 6, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.scale.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.bias.value", "write_shape": [2], "chunk_shape": [2], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.kernel.value", "write_shape": [48, 64], "chunk_shape": [48, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.modulation.value", "write_shape": [1, 2, 48], "chunk_shape": [1, 2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.scale.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.kernel.value", "write_shape": [40, 1280], "chunk_shape": [40, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.kernel.value", "write_shape": [40, 1536], "chunk_shape": [40, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.scale.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.kernel.value", "write_shape": [1, 2, 2, 36, 48], "chunk_shape": [1, 2, 2, 36, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "player_embed.embedding.value", "write_shape": [2, 48], "chunk_shape": [2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.kernel.value", "write_shape": [8, 1536], "chunk_shape": [8, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.kernel.value", "write_shape": [48, 1536], "chunk_shape": [48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.bias.value", "write_shape": [288], "chunk_shape": [288], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.kernel.value", "write_shape": [48, 9216], "chunk_shape": [48, 9216], "ext_metadata": null}}]}
mp_causal_60000.pt/array_metadatas/process_7 ADDED
@@ -0,0 +1 @@
 
 
1
+ {"array_metadatas": [{"array_metadata": {"param_name": "blocks.action_model.img_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.img_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_k_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.key_attn_q_norm.weight.value", "write_shape": [30, 2], "chunk_shape": [30, 2], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_attn_kv.kernel.value", "write_shape": [30, 48, 2048], "chunk_shape": [30, 48, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.0.kernel.value", "write_shape": [30, 23, 4], "chunk_shape": [30, 23, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.bias.value", "write_shape": [30, 4], "chunk_shape": [30, 4], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.keyboard_embed.layers.2.kernel.value", "write_shape": [30, 4, 128], "chunk_shape": [30, 4, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_attn_q.kernel.value", "write_shape": [30, 48, 1024], "chunk_shape": [30, 48, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.0.kernel.value", "write_shape": [30, 1560, 32], "chunk_shape": [30, 1560, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.2.kernel.value", "write_shape": [30, 32, 1024], "chunk_shape": [30, 32, 1024], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.bias.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.mouse_mlp.layers.3.scale.value", "write_shape": [30, 32], "chunk_shape": [30, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_keyboard.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.proj_mouse.kernel.value", "write_shape": [30, 32, 1536], "chunk_shape": [30, 32, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.action_model.t_qkv.kernel.value", "write_shape": [30, 32, 3072], "chunk_shape": [30, 32, 3072], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.cross_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.bias.value", "write_shape": [30, 280], "chunk_shape": [30, 280], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.0.kernel.value", "write_shape": [30, 48, 8960], "chunk_shape": [30, 48, 8960], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.ffn.layers.2.kernel.value", "write_shape": [30, 280, 1536], "chunk_shape": [30, 280, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.modulation.value", "write_shape": [30, 1, 6, 48], "chunk_shape": [30, 1, 6, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.norm3.scale.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.k.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_k.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.norm_q.weight.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.o.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.q.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.bias.value", "write_shape": [30, 48], "chunk_shape": [30, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "blocks.self_attn.v.kernel.value", "write_shape": [30, 48, 1536], "chunk_shape": [30, 48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.bias.value", "write_shape": [2], "chunk_shape": [2], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.head.kernel.value", "write_shape": [48, 64], "chunk_shape": [48, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "head.modulation.value", "write_shape": [1, 2, 48], "chunk_shape": [1, 2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.0.scale.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.bias.value", "write_shape": [40], "chunk_shape": [40], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.1.kernel.value", "write_shape": [40, 1280], "chunk_shape": [40, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.2.kernel.value", "write_shape": [40, 1536], "chunk_shape": [40, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "img_emb.proj.3.scale.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "patch_embedding.kernel.value", "write_shape": [1, 2, 2, 36, 48], "chunk_shape": [1, 2, 2, 36, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "player_embed.embedding.value", "write_shape": [2, 48], "chunk_shape": [2, 48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.0.kernel.value", "write_shape": [8, 1536], "chunk_shape": [8, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.bias.value", "write_shape": [48], "chunk_shape": [48], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_embedding.layers.2.kernel.value", "write_shape": [48, 1536], "chunk_shape": [48, 1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.bias.value", "write_shape": [288], "chunk_shape": [288], "ext_metadata": null}}, {"array_metadata": {"param_name": "time_projection.layers.1.kernel.value", "write_shape": [48, 9216], "chunk_shape": [48, 9216], "ext_metadata": null}}]}
mp_causal_60000.pt/commit_success.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ Checkpoint commit was successful to gs://solaris-east5/solaris/model/pretrained/v2_flagship_fix_bidirectional_causal_60000.pt
mp_causal_60000.pt/d/009656ae062ac3299a9aa0f0d609e4aa ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02d7447bad0c18a6d568011b800856902299d811f80b0de990e4e50b9c7f61e9
3
+ size 116307
mp_causal_60000.pt/manifest.ocdbt ADDED
Binary file (120 Bytes). View file
 
mp_causal_60000.pt/ocdbt.process_0/d/3695460b7707a19f8f8eecb85bd97ab2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac8e7966d275fb5f0f9c972b52326c8061c4c773ff724b7c5e6d0c3d4fd6b521
3
+ size 212370278
mp_causal_60000.pt/ocdbt.process_0/d/417a017d285ccaa9531f43c034552e58 ADDED
Binary file (277 Bytes). View file
 
mp_causal_60000.pt/ocdbt.process_0/d/5abdbd3f4919e95295173e494a934cbb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efcb6a27950449d68b2b02d988f81e0f2da836254982288a35cee56c600b9ff5
3
+ size 513400016
mp_causal_60000.pt/ocdbt.process_0/d/ab13a2e3a9a8f7101f3308d66a9d8952 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:574b86c86413a2c03345d0b5c00615861979d5d7f6ef61078325386c2b48a972
3
+ size 23301988
mp_causal_60000.pt/ocdbt.process_0/manifest.ocdbt ADDED
Binary file (264 Bytes). View file
 
mp_causal_60000.pt/ocdbt.process_1/d/49765cb511d5a29ed37a4f1fef7718e6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac8b7e827037d901c28d3b9f5ded953bb6b265a9df39eb658c1b0bdb45238725
3
+ size 382263820
mp_causal_60000.pt/ocdbt.process_1/d/525417d8de2264a1cc2ceb60acb26ec5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11baf290a2b0648ca71a4dded38a428bb9a1ed7d92f47f4badef2df7ef0d5f05
3
+ size 366856718
mp_causal_60000.pt/ocdbt.process_1/manifest.ocdbt ADDED
Binary file (184 Bytes). View file
 
mp_causal_60000.pt/ocdbt.process_2/d/0be520c321a634b0ca6f4fe6bce8e891 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b8dc489b4cc9d206a533591bc01e88b2e2b55856f0515eef3320bb31be0915e
3
+ size 382256745
mp_causal_60000.pt/ocdbt.process_2/d/225c40b0464162d4d3665808d735893d ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04929c8c58f69a214a0a15fa4b92e11d87807f8315fbc71e478209ed30174e39
3
+ size 366847454
mp_causal_60000.pt/ocdbt.process_2/manifest.ocdbt ADDED
Binary file (184 Bytes). View file
 
mp_causal_60000.pt/ocdbt.process_3/d/21c873b9a7006fb3b7b2a3345f2007dd ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dba9d56ccbb1971fe25108855e78fdeec0984bc20345d629d5f61d8e6561224a
3
+ size 334453584
mp_causal_60000.pt/ocdbt.process_3/d/5fab00d2588cd26a1ec3265788f45294 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99c1f6ac05b6cdb314aa4daf01469958605cd266444b8850328c65c3e906a0b2
3
+ size 414659137
mp_causal_60000.pt/ocdbt.process_3/manifest.ocdbt ADDED
Binary file (184 Bytes). View file
 
mp_causal_60000.pt/ocdbt.process_4/d/04bc0911120bfcb6658465a2768bb823 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5078f52bebf0ddd82eb72b7cd34dd0a8ebb2eb446661a6aa4f7412598b6e0b87
3
+ size 366859743
mp_causal_60000.pt/ocdbt.process_4/d/160e82bbbfe8c7eb03559a914b57807f ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:034b691dc67e519516398b88bde467508b610e4e09cfc20f2bc05e15f500fdbe
3
+ size 382290852
mp_causal_60000.pt/ocdbt.process_4/manifest.ocdbt ADDED
Binary file (184 Bytes). View file
 
mp_causal_60000.pt/ocdbt.process_5/d/0105ce032e58c01b1a87722da49cf075 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b090da15b3744119ad4842c0acf3133f1b753f42e103dbce925c23a43074457
3
+ size 184492463
mp_causal_60000.pt/ocdbt.process_5/d/0d767211e01bd5107223d6ebb4b55e55 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8c24e1e864f25f99d6bd23f2ef6039f949e3914ff5b3614934e9db3810dda5a
3
+ size 564591736
mp_causal_60000.pt/ocdbt.process_5/manifest.ocdbt ADDED
Binary file (181 Bytes). View file
 
mp_causal_60000.pt/ocdbt.process_6/d/322c3f14eefdd0d22a2b21107075a20e ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2a5206db4af5163487b58ff356ba71fcee74423f96c03df361c8bdc472eacc2
3
+ size 366836963
mp_causal_60000.pt/ocdbt.process_6/d/c372ea76909d79ee62ec3a482a4b6865 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b079c2d391beb29c30dcec6da3bfc221bdeeb9bcc0e97ef50da239b98f538b5
3
+ size 382266111
mp_causal_60000.pt/ocdbt.process_6/manifest.ocdbt ADDED
Binary file (184 Bytes). View file
 
mp_causal_60000.pt/ocdbt.process_7/d/5bc6c9d3af5b0900c8806766c6192a53 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed723a34d48a98a8797402a11324bb9acc9371f08cb16cc4574e0cf0ed11fd05
3
+ size 325895593
mp_causal_60000.pt/ocdbt.process_7/d/5e7e04aee528841d2f1b0d91d946db66 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:414f983eb2fb9808d89e9d87668a3569524efc4b2c024809380d792bf954d210
3
+ size 423201869
mp_causal_60000.pt/ocdbt.process_7/manifest.ocdbt ADDED
Binary file (183 Bytes). View file