Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +15 -0
- sft_ckpt/2572/_CHECKPOINT_METADATA +1 -0
- sft_ckpt/2572/model_params/_METADATA +0 -0
- sft_ckpt/2572/model_params/_sharding +1 -0
- sft_ckpt/2572/model_params/array_metadatas/process_0 +1 -0
- sft_ckpt/2572/model_params/d/5eeef6bccf874e48f4ea977dda491431 +0 -0
- sft_ckpt/2572/model_params/manifest.ocdbt +0 -0
- sft_ckpt/2572/model_params/ocdbt.process_0/d/290572c5d8678d3ea2d4e4b05461bebe +3 -0
- sft_ckpt/2572/model_params/ocdbt.process_0/d/2d8029e565e1c9ace8a78cc004c9a1f1 +3 -0
- sft_ckpt/2572/model_params/ocdbt.process_0/d/495ad0bab89cd857cee7eebb47a25202 +3 -0
- sft_ckpt/2572/model_params/ocdbt.process_0/d/914119694ed011bf405e78ae15e6089c +0 -0
- sft_ckpt/2572/model_params/ocdbt.process_0/d/b1e738f406479115242793b35ef3948f +0 -0
- sft_ckpt/2572/model_params/ocdbt.process_0/d/eb0574f1b718e3a72de00d309731f3be +0 -0
- sft_ckpt/2572/model_params/ocdbt.process_0/manifest.ocdbt +0 -0
- sft_ckpt/3883/_CHECKPOINT_METADATA +1 -0
- sft_ckpt/3883/model_params/_METADATA +0 -0
- sft_ckpt/3883/model_params/_sharding +1 -0
- sft_ckpt/3883/model_params/array_metadatas/process_0 +1 -0
- sft_ckpt/3883/model_params/d/945d9ee2b0628a3ca52543282ed39bd3 +0 -0
- sft_ckpt/3883/model_params/manifest.ocdbt +0 -0
- sft_ckpt/3883/model_params/ocdbt.process_0/d/30f1b983b274b82cc04996a796cd6a84 +3 -0
- sft_ckpt/3883/model_params/ocdbt.process_0/d/4ced86e6202e91a73ccea56b89caf26a +3 -0
- sft_ckpt/3883/model_params/ocdbt.process_0/d/5854a28beb465f0b3c62bf2d6ca4f6ae +3 -0
- sft_ckpt/3883/model_params/ocdbt.process_0/d/6a0822e5cf7854a94037f036a6e683bd +3 -0
- sft_ckpt/3883/model_params/ocdbt.process_0/d/9f6bd13ae6300be1a85e16c5adfcfc61 +0 -0
- sft_ckpt/3883/model_params/ocdbt.process_0/d/b31d82eeaf25575e688eeef907fe2c77 +0 -0
- sft_ckpt/3883/model_params/ocdbt.process_0/manifest.ocdbt +0 -0
- sft_ckpt/5000/_CHECKPOINT_METADATA +1 -0
- sft_ckpt/5000/model_params/_METADATA +0 -0
- sft_ckpt/5000/model_params/_sharding +1 -0
- sft_ckpt/5000/model_params/array_metadatas/process_0 +1 -0
- sft_ckpt/5000/model_params/d/c9caf11b5f29b8c2861e5ac1ef34bc04 +0 -0
- sft_ckpt/5000/model_params/manifest.ocdbt +0 -0
- sft_ckpt/5000/model_params/ocdbt.process_0/d/03006177174f19f3a92f0d5d97f8ed31 +3 -0
- sft_ckpt/5000/model_params/ocdbt.process_0/d/4e56edcead7ffd2d8b23bbb874557dbb +3 -0
- sft_ckpt/5000/model_params/ocdbt.process_0/d/51e04d30e831472d47c1fa4b5f389d8f +0 -0
- sft_ckpt/5000/model_params/ocdbt.process_0/d/6bf77ef2ee1f00ea5a87c9221dfcb748 +0 -0
- sft_ckpt/5000/model_params/ocdbt.process_0/d/d3cf8776c3cb51991b5e69c6e25b9f3f +3 -0
- sft_ckpt/5000/model_params/ocdbt.process_0/manifest.ocdbt +0 -0
- sft_ckpt/final/_CHECKPOINT_METADATA +1 -0
- sft_ckpt/final/_METADATA +0 -0
- sft_ckpt/final/_sharding +1 -0
- sft_ckpt/final/array_metadatas/process_0 +1 -0
- sft_ckpt/final/d/48deca6292cb97ba955456412dc30d00 +0 -0
- sft_ckpt/final/manifest.ocdbt +0 -0
- sft_ckpt/final/ocdbt.process_0/d/4a6d6fdddb293719dc805175d035be68 +3 -0
- sft_ckpt/final/ocdbt.process_0/d/86e0eb73f2e05e489be9db977b37c014 +3 -0
- sft_ckpt/final/ocdbt.process_0/d/9d9e4d3965b9c252af699486babacbc3 +3 -0
- sft_ckpt/final/ocdbt.process_0/d/9f03e1d63be7a07069a44caa9a02a442 +0 -0
- sft_ckpt/final/ocdbt.process_0/d/c05b0bf61423c90ccbfcd19c0ce8f33d +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,18 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
sft_ckpt/2572/model_params/ocdbt.process_0/d/290572c5d8678d3ea2d4e4b05461bebe filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
sft_ckpt/2572/model_params/ocdbt.process_0/d/2d8029e565e1c9ace8a78cc004c9a1f1 filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
sft_ckpt/2572/model_params/ocdbt.process_0/d/495ad0bab89cd857cee7eebb47a25202 filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
sft_ckpt/3883/model_params/ocdbt.process_0/d/30f1b983b274b82cc04996a796cd6a84 filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
sft_ckpt/3883/model_params/ocdbt.process_0/d/4ced86e6202e91a73ccea56b89caf26a filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
sft_ckpt/3883/model_params/ocdbt.process_0/d/5854a28beb465f0b3c62bf2d6ca4f6ae filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
sft_ckpt/3883/model_params/ocdbt.process_0/d/6a0822e5cf7854a94037f036a6e683bd filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
sft_ckpt/5000/model_params/ocdbt.process_0/d/03006177174f19f3a92f0d5d97f8ed31 filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
sft_ckpt/5000/model_params/ocdbt.process_0/d/4e56edcead7ffd2d8b23bbb874557dbb filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
sft_ckpt/5000/model_params/ocdbt.process_0/d/d3cf8776c3cb51991b5e69c6e25b9f3f filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
sft_ckpt/final/ocdbt.process_0/d/4a6d6fdddb293719dc805175d035be68 filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
sft_ckpt/final/ocdbt.process_0/d/86e0eb73f2e05e489be9db977b37c014 filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
sft_ckpt/final/ocdbt.process_0/d/9d9e4d3965b9c252af699486babacbc3 filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
sft_ckpt/final/ocdbt.process_0/d/c05b0bf61423c90ccbfcd19c0ce8f33d filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
sft_ckpt/final/ocdbt.process_0/d/d0a1561b0db1a073464552a6aad57757 filter=lfs diff=lfs merge=lfs -text
|
sft_ckpt/2572/_CHECKPOINT_METADATA
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"item_handlers": {"model_params": "orbax.checkpoint._src.handlers.standard_checkpoint_handler.StandardCheckpointHandler"}, "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1768234005174125988, "commit_timestamp_nsecs": 1768234011473829769, "custom_metadata": {}}
|
sft_ckpt/2572/model_params/_METADATA
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
sft_ckpt/2572/model_params/_sharding
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"bGF5ZXJzLjAuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}"}
|
sft_ckpt/2572/model_params/array_metadatas/process_0
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "layers.0.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}]}
|
sft_ckpt/2572/model_params/d/5eeef6bccf874e48f4ea977dda491431
ADDED
|
Binary file (2.74 kB). View file
|
|
|
sft_ckpt/2572/model_params/manifest.ocdbt
ADDED
|
Binary file (117 Bytes). View file
|
|
|
sft_ckpt/2572/model_params/ocdbt.process_0/d/290572c5d8678d3ea2d4e4b05461bebe
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c98902db41419a26e5274e2964c6dff06e3a42589acb277c6fa56e0d6f5d9231
|
| 3 |
+
size 42545152
|
sft_ckpt/2572/model_params/ocdbt.process_0/d/2d8029e565e1c9ace8a78cc004c9a1f1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e8175d2d264c9ac606bd3d89c458c5566caa702688452bad5589c30f5d0c6c54
|
| 3 |
+
size 43208704
|
sft_ckpt/2572/model_params/ocdbt.process_0/d/495ad0bab89cd857cee7eebb47a25202
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9cf47d6494e3403493cc788145f3eaeb80b3ea43d1f54c0a503a590ed58c64b9
|
| 3 |
+
size 24338432
|
sft_ckpt/2572/model_params/ocdbt.process_0/d/914119694ed011bf405e78ae15e6089c
ADDED
|
Binary file (474 Bytes). View file
|
|
|
sft_ckpt/2572/model_params/ocdbt.process_0/d/b1e738f406479115242793b35ef3948f
ADDED
|
Binary file (479 Bytes). View file
|
|
|
sft_ckpt/2572/model_params/ocdbt.process_0/d/eb0574f1b718e3a72de00d309731f3be
ADDED
|
Binary file (206 Bytes). View file
|
|
|
sft_ckpt/2572/model_params/ocdbt.process_0/manifest.ocdbt
ADDED
|
Binary file (356 Bytes). View file
|
|
|
sft_ckpt/3883/_CHECKPOINT_METADATA
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"item_handlers": {"model_params": "orbax.checkpoint._src.handlers.standard_checkpoint_handler.StandardCheckpointHandler"}, "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1768234185243970556, "commit_timestamp_nsecs": 1768234186243356788, "custom_metadata": {}}
|
sft_ckpt/3883/model_params/_METADATA
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
sft_ckpt/3883/model_params/_sharding
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"bGF5ZXJzLjAuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}"}
|
sft_ckpt/3883/model_params/array_metadatas/process_0
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "layers.0.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}]}
|
sft_ckpt/3883/model_params/d/945d9ee2b0628a3ca52543282ed39bd3
ADDED
|
Binary file (2.8 kB). View file
|
|
|
sft_ckpt/3883/model_params/manifest.ocdbt
ADDED
|
Binary file (117 Bytes). View file
|
|
|
sft_ckpt/3883/model_params/ocdbt.process_0/d/30f1b983b274b82cc04996a796cd6a84
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed6ce6d23108f1774c937d514dd56423eb25b1c683a9466247d53ae05cf43b31
|
| 3 |
+
size 43794432
|
sft_ckpt/3883/model_params/ocdbt.process_0/d/4ced86e6202e91a73ccea56b89caf26a
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:92f0fec1874c9822d64c4339fe807fcab10b14f88b27b52be8c68d79c1d19bb4
|
| 3 |
+
size 46153728
|
sft_ckpt/3883/model_params/ocdbt.process_0/d/5854a28beb465f0b3c62bf2d6ca4f6ae
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0bb747661dc47281556e91232d54ee8d49d7654dd1e33e0baf5fede72573ad24
|
| 3 |
+
size 19259392
|
sft_ckpt/3883/model_params/ocdbt.process_0/d/6a0822e5cf7854a94037f036a6e683bd
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88a75029dcd7b6145661dec8bebd13bebea06d7f271f35e34083378e39564af7
|
| 3 |
+
size 1112839
|
sft_ckpt/3883/model_params/ocdbt.process_0/d/9f6bd13ae6300be1a85e16c5adfcfc61
ADDED
|
Binary file (452 Bytes). View file
|
|
|
sft_ckpt/3883/model_params/ocdbt.process_0/d/b31d82eeaf25575e688eeef907fe2c77
ADDED
|
Binary file (206 Bytes). View file
|
|
|
sft_ckpt/3883/model_params/ocdbt.process_0/manifest.ocdbt
ADDED
|
Binary file (367 Bytes). View file
|
|
|
sft_ckpt/5000/_CHECKPOINT_METADATA
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"item_handlers": {"model_params": "orbax.checkpoint._src.handlers.standard_checkpoint_handler.StandardCheckpointHandler"}, "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1768234316590133098, "commit_timestamp_nsecs": 1768234317507606501, "custom_metadata": {}}
|
sft_ckpt/5000/model_params/_METADATA
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
sft_ckpt/5000/model_params/_sharding
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"bGF5ZXJzLjAuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}"}
|
sft_ckpt/5000/model_params/array_metadatas/process_0
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "layers.0.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}]}
|
sft_ckpt/5000/model_params/d/c9caf11b5f29b8c2861e5ac1ef34bc04
ADDED
|
Binary file (2.73 kB). View file
|
|
|
sft_ckpt/5000/model_params/manifest.ocdbt
ADDED
|
Binary file (117 Bytes). View file
|
|
|
sft_ckpt/5000/model_params/ocdbt.process_0/d/03006177174f19f3a92f0d5d97f8ed31
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1add560548ce632c7f28cf32104fa48576288a3695deddec81d89e5243fa2767
|
| 3 |
+
size 23289856
|
sft_ckpt/5000/model_params/ocdbt.process_0/d/4e56edcead7ffd2d8b23bbb874557dbb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:03b6de97057df082db2428282da45fc206725228bef7312fd4b3153cbafaae1c
|
| 3 |
+
size 11644928
|
sft_ckpt/5000/model_params/ocdbt.process_0/d/51e04d30e831472d47c1fa4b5f389d8f
ADDED
|
Binary file (206 Bytes). View file
|
|
|
sft_ckpt/5000/model_params/ocdbt.process_0/d/6bf77ef2ee1f00ea5a87c9221dfcb748
ADDED
|
Binary file (464 Bytes). View file
|
|
|
sft_ckpt/5000/model_params/ocdbt.process_0/d/d3cf8776c3cb51991b5e69c6e25b9f3f
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3821f79c250ce901a2c15eacf5a94702ab4ae27f7b62839addca0783623b004e
|
| 3 |
+
size 75497472
|
sft_ckpt/5000/model_params/ocdbt.process_0/manifest.ocdbt
ADDED
|
Binary file (322 Bytes). View file
|
|
|
sft_ckpt/final/_CHECKPOINT_METADATA
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"item_handlers": "orbax.checkpoint._src.handlers.standard_checkpoint_handler.StandardCheckpointHandler", "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1768234317846803583, "commit_timestamp_nsecs": 1768234318780793646, "custom_metadata": {}}
|
sft_ckpt/final/_METADATA
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
sft_ckpt/final/_sharding
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"bGF5ZXJzLjAuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}"}
|
sft_ckpt/final/array_metadatas/process_0
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "layers.0.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}]}
|
sft_ckpt/final/d/48deca6292cb97ba955456412dc30d00
ADDED
|
Binary file (2.85 kB). View file
|
|
|
sft_ckpt/final/manifest.ocdbt
ADDED
|
Binary file (117 Bytes). View file
|
|
|
sft_ckpt/final/ocdbt.process_0/d/4a6d6fdddb293719dc805175d035be68
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:90c111bcf3f2521835dc59cf77fa7e5ab26a57dc1224c43e143afe87f8195a57
|
| 3 |
+
size 6012928
|
sft_ckpt/final/ocdbt.process_0/d/86e0eb73f2e05e489be9db977b37c014
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6bb66222d7c519cf46308191bddd2e7e7c0f01ccfe5e215bc09a6f04c4d30ceb
|
| 3 |
+
size 452463
|
sft_ckpt/final/ocdbt.process_0/d/9d9e4d3965b9c252af699486babacbc3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e054764458a7e05b1a8eb82e71ffc8a4c56c646d8eb904252bf5be56eb8f19f1
|
| 3 |
+
size 19869696
|
sft_ckpt/final/ocdbt.process_0/d/9f03e1d63be7a07069a44caa9a02a442
ADDED
|
Binary file (474 Bytes). View file
|
|
|
sft_ckpt/final/ocdbt.process_0/d/c05b0bf61423c90ccbfcd19c0ce8f33d
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5eb6316b69ff53d675f416a44fc1a443ddf452eec377d1bbd079216c9c39aec4
|
| 3 |
+
size 73633792
|