nanat05525 commited on
Commit
0373059
·
verified ·
1 Parent(s): 73017e5

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +15 -0
  2. sft_ckpt/2572/_CHECKPOINT_METADATA +1 -0
  3. sft_ckpt/2572/model_params/_METADATA +0 -0
  4. sft_ckpt/2572/model_params/_sharding +1 -0
  5. sft_ckpt/2572/model_params/array_metadatas/process_0 +1 -0
  6. sft_ckpt/2572/model_params/d/5eeef6bccf874e48f4ea977dda491431 +0 -0
  7. sft_ckpt/2572/model_params/manifest.ocdbt +0 -0
  8. sft_ckpt/2572/model_params/ocdbt.process_0/d/290572c5d8678d3ea2d4e4b05461bebe +3 -0
  9. sft_ckpt/2572/model_params/ocdbt.process_0/d/2d8029e565e1c9ace8a78cc004c9a1f1 +3 -0
  10. sft_ckpt/2572/model_params/ocdbt.process_0/d/495ad0bab89cd857cee7eebb47a25202 +3 -0
  11. sft_ckpt/2572/model_params/ocdbt.process_0/d/914119694ed011bf405e78ae15e6089c +0 -0
  12. sft_ckpt/2572/model_params/ocdbt.process_0/d/b1e738f406479115242793b35ef3948f +0 -0
  13. sft_ckpt/2572/model_params/ocdbt.process_0/d/eb0574f1b718e3a72de00d309731f3be +0 -0
  14. sft_ckpt/2572/model_params/ocdbt.process_0/manifest.ocdbt +0 -0
  15. sft_ckpt/3883/_CHECKPOINT_METADATA +1 -0
  16. sft_ckpt/3883/model_params/_METADATA +0 -0
  17. sft_ckpt/3883/model_params/_sharding +1 -0
  18. sft_ckpt/3883/model_params/array_metadatas/process_0 +1 -0
  19. sft_ckpt/3883/model_params/d/945d9ee2b0628a3ca52543282ed39bd3 +0 -0
  20. sft_ckpt/3883/model_params/manifest.ocdbt +0 -0
  21. sft_ckpt/3883/model_params/ocdbt.process_0/d/30f1b983b274b82cc04996a796cd6a84 +3 -0
  22. sft_ckpt/3883/model_params/ocdbt.process_0/d/4ced86e6202e91a73ccea56b89caf26a +3 -0
  23. sft_ckpt/3883/model_params/ocdbt.process_0/d/5854a28beb465f0b3c62bf2d6ca4f6ae +3 -0
  24. sft_ckpt/3883/model_params/ocdbt.process_0/d/6a0822e5cf7854a94037f036a6e683bd +3 -0
  25. sft_ckpt/3883/model_params/ocdbt.process_0/d/9f6bd13ae6300be1a85e16c5adfcfc61 +0 -0
  26. sft_ckpt/3883/model_params/ocdbt.process_0/d/b31d82eeaf25575e688eeef907fe2c77 +0 -0
  27. sft_ckpt/3883/model_params/ocdbt.process_0/manifest.ocdbt +0 -0
  28. sft_ckpt/5000/_CHECKPOINT_METADATA +1 -0
  29. sft_ckpt/5000/model_params/_METADATA +0 -0
  30. sft_ckpt/5000/model_params/_sharding +1 -0
  31. sft_ckpt/5000/model_params/array_metadatas/process_0 +1 -0
  32. sft_ckpt/5000/model_params/d/c9caf11b5f29b8c2861e5ac1ef34bc04 +0 -0
  33. sft_ckpt/5000/model_params/manifest.ocdbt +0 -0
  34. sft_ckpt/5000/model_params/ocdbt.process_0/d/03006177174f19f3a92f0d5d97f8ed31 +3 -0
  35. sft_ckpt/5000/model_params/ocdbt.process_0/d/4e56edcead7ffd2d8b23bbb874557dbb +3 -0
  36. sft_ckpt/5000/model_params/ocdbt.process_0/d/51e04d30e831472d47c1fa4b5f389d8f +0 -0
  37. sft_ckpt/5000/model_params/ocdbt.process_0/d/6bf77ef2ee1f00ea5a87c9221dfcb748 +0 -0
  38. sft_ckpt/5000/model_params/ocdbt.process_0/d/d3cf8776c3cb51991b5e69c6e25b9f3f +3 -0
  39. sft_ckpt/5000/model_params/ocdbt.process_0/manifest.ocdbt +0 -0
  40. sft_ckpt/final/_CHECKPOINT_METADATA +1 -0
  41. sft_ckpt/final/_METADATA +0 -0
  42. sft_ckpt/final/_sharding +1 -0
  43. sft_ckpt/final/array_metadatas/process_0 +1 -0
  44. sft_ckpt/final/d/48deca6292cb97ba955456412dc30d00 +0 -0
  45. sft_ckpt/final/manifest.ocdbt +0 -0
  46. sft_ckpt/final/ocdbt.process_0/d/4a6d6fdddb293719dc805175d035be68 +3 -0
  47. sft_ckpt/final/ocdbt.process_0/d/86e0eb73f2e05e489be9db977b37c014 +3 -0
  48. sft_ckpt/final/ocdbt.process_0/d/9d9e4d3965b9c252af699486babacbc3 +3 -0
  49. sft_ckpt/final/ocdbt.process_0/d/9f03e1d63be7a07069a44caa9a02a442 +0 -0
  50. sft_ckpt/final/ocdbt.process_0/d/c05b0bf61423c90ccbfcd19c0ce8f33d +3 -0
.gitattributes CHANGED
@@ -33,3 +33,18 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ sft_ckpt/2572/model_params/ocdbt.process_0/d/290572c5d8678d3ea2d4e4b05461bebe filter=lfs diff=lfs merge=lfs -text
37
+ sft_ckpt/2572/model_params/ocdbt.process_0/d/2d8029e565e1c9ace8a78cc004c9a1f1 filter=lfs diff=lfs merge=lfs -text
38
+ sft_ckpt/2572/model_params/ocdbt.process_0/d/495ad0bab89cd857cee7eebb47a25202 filter=lfs diff=lfs merge=lfs -text
39
+ sft_ckpt/3883/model_params/ocdbt.process_0/d/30f1b983b274b82cc04996a796cd6a84 filter=lfs diff=lfs merge=lfs -text
40
+ sft_ckpt/3883/model_params/ocdbt.process_0/d/4ced86e6202e91a73ccea56b89caf26a filter=lfs diff=lfs merge=lfs -text
41
+ sft_ckpt/3883/model_params/ocdbt.process_0/d/5854a28beb465f0b3c62bf2d6ca4f6ae filter=lfs diff=lfs merge=lfs -text
42
+ sft_ckpt/3883/model_params/ocdbt.process_0/d/6a0822e5cf7854a94037f036a6e683bd filter=lfs diff=lfs merge=lfs -text
43
+ sft_ckpt/5000/model_params/ocdbt.process_0/d/03006177174f19f3a92f0d5d97f8ed31 filter=lfs diff=lfs merge=lfs -text
44
+ sft_ckpt/5000/model_params/ocdbt.process_0/d/4e56edcead7ffd2d8b23bbb874557dbb filter=lfs diff=lfs merge=lfs -text
45
+ sft_ckpt/5000/model_params/ocdbt.process_0/d/d3cf8776c3cb51991b5e69c6e25b9f3f filter=lfs diff=lfs merge=lfs -text
46
+ sft_ckpt/final/ocdbt.process_0/d/4a6d6fdddb293719dc805175d035be68 filter=lfs diff=lfs merge=lfs -text
47
+ sft_ckpt/final/ocdbt.process_0/d/86e0eb73f2e05e489be9db977b37c014 filter=lfs diff=lfs merge=lfs -text
48
+ sft_ckpt/final/ocdbt.process_0/d/9d9e4d3965b9c252af699486babacbc3 filter=lfs diff=lfs merge=lfs -text
49
+ sft_ckpt/final/ocdbt.process_0/d/c05b0bf61423c90ccbfcd19c0ce8f33d filter=lfs diff=lfs merge=lfs -text
50
+ sft_ckpt/final/ocdbt.process_0/d/d0a1561b0db1a073464552a6aad57757 filter=lfs diff=lfs merge=lfs -text
sft_ckpt/2572/_CHECKPOINT_METADATA ADDED
@@ -0,0 +1 @@
 
 
1
+ {"item_handlers": {"model_params": "orbax.checkpoint._src.handlers.standard_checkpoint_handler.StandardCheckpointHandler"}, "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1768234005174125988, "commit_timestamp_nsecs": 1768234011473829769, "custom_metadata": {}}
sft_ckpt/2572/model_params/_METADATA ADDED
The diff for this file is too large to render. See raw diff
 
sft_ckpt/2572/model_params/_sharding ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bGF5ZXJzLjAuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}"}
sft_ckpt/2572/model_params/array_metadatas/process_0 ADDED
@@ -0,0 +1 @@
 
 
1
+ {"array_metadatas": [{"array_metadata": {"param_name": "layers.0.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}]}
sft_ckpt/2572/model_params/d/5eeef6bccf874e48f4ea977dda491431 ADDED
Binary file (2.74 kB). View file
 
sft_ckpt/2572/model_params/manifest.ocdbt ADDED
Binary file (117 Bytes). View file
 
sft_ckpt/2572/model_params/ocdbt.process_0/d/290572c5d8678d3ea2d4e4b05461bebe ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c98902db41419a26e5274e2964c6dff06e3a42589acb277c6fa56e0d6f5d9231
3
+ size 42545152
sft_ckpt/2572/model_params/ocdbt.process_0/d/2d8029e565e1c9ace8a78cc004c9a1f1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8175d2d264c9ac606bd3d89c458c5566caa702688452bad5589c30f5d0c6c54
3
+ size 43208704
sft_ckpt/2572/model_params/ocdbt.process_0/d/495ad0bab89cd857cee7eebb47a25202 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cf47d6494e3403493cc788145f3eaeb80b3ea43d1f54c0a503a590ed58c64b9
3
+ size 24338432
sft_ckpt/2572/model_params/ocdbt.process_0/d/914119694ed011bf405e78ae15e6089c ADDED
Binary file (474 Bytes). View file
 
sft_ckpt/2572/model_params/ocdbt.process_0/d/b1e738f406479115242793b35ef3948f ADDED
Binary file (479 Bytes). View file
 
sft_ckpt/2572/model_params/ocdbt.process_0/d/eb0574f1b718e3a72de00d309731f3be ADDED
Binary file (206 Bytes). View file
 
sft_ckpt/2572/model_params/ocdbt.process_0/manifest.ocdbt ADDED
Binary file (356 Bytes). View file
 
sft_ckpt/3883/_CHECKPOINT_METADATA ADDED
@@ -0,0 +1 @@
 
 
1
+ {"item_handlers": {"model_params": "orbax.checkpoint._src.handlers.standard_checkpoint_handler.StandardCheckpointHandler"}, "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1768234185243970556, "commit_timestamp_nsecs": 1768234186243356788, "custom_metadata": {}}
sft_ckpt/3883/model_params/_METADATA ADDED
The diff for this file is too large to render. See raw diff
 
sft_ckpt/3883/model_params/_sharding ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bGF5ZXJzLjAuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}"}
sft_ckpt/3883/model_params/array_metadatas/process_0 ADDED
@@ -0,0 +1 @@
 
 
1
+ {"array_metadatas": [{"array_metadata": {"param_name": "layers.0.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}]}
sft_ckpt/3883/model_params/d/945d9ee2b0628a3ca52543282ed39bd3 ADDED
Binary file (2.8 kB). View file
 
sft_ckpt/3883/model_params/manifest.ocdbt ADDED
Binary file (117 Bytes). View file
 
sft_ckpt/3883/model_params/ocdbt.process_0/d/30f1b983b274b82cc04996a796cd6a84 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed6ce6d23108f1774c937d514dd56423eb25b1c683a9466247d53ae05cf43b31
3
+ size 43794432
sft_ckpt/3883/model_params/ocdbt.process_0/d/4ced86e6202e91a73ccea56b89caf26a ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92f0fec1874c9822d64c4339fe807fcab10b14f88b27b52be8c68d79c1d19bb4
3
+ size 46153728
sft_ckpt/3883/model_params/ocdbt.process_0/d/5854a28beb465f0b3c62bf2d6ca4f6ae ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bb747661dc47281556e91232d54ee8d49d7654dd1e33e0baf5fede72573ad24
3
+ size 19259392
sft_ckpt/3883/model_params/ocdbt.process_0/d/6a0822e5cf7854a94037f036a6e683bd ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88a75029dcd7b6145661dec8bebd13bebea06d7f271f35e34083378e39564af7
3
+ size 1112839
sft_ckpt/3883/model_params/ocdbt.process_0/d/9f6bd13ae6300be1a85e16c5adfcfc61 ADDED
Binary file (452 Bytes). View file
 
sft_ckpt/3883/model_params/ocdbt.process_0/d/b31d82eeaf25575e688eeef907fe2c77 ADDED
Binary file (206 Bytes). View file
 
sft_ckpt/3883/model_params/ocdbt.process_0/manifest.ocdbt ADDED
Binary file (367 Bytes). View file
 
sft_ckpt/5000/_CHECKPOINT_METADATA ADDED
@@ -0,0 +1 @@
 
 
1
+ {"item_handlers": {"model_params": "orbax.checkpoint._src.handlers.standard_checkpoint_handler.StandardCheckpointHandler"}, "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1768234316590133098, "commit_timestamp_nsecs": 1768234317507606501, "custom_metadata": {}}
sft_ckpt/5000/model_params/_METADATA ADDED
The diff for this file is too large to render. See raw diff
 
sft_ckpt/5000/model_params/_sharding ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bGF5ZXJzLjAuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}"}
sft_ckpt/5000/model_params/array_metadatas/process_0 ADDED
@@ -0,0 +1 @@
 
 
1
+ {"array_metadatas": [{"array_metadata": {"param_name": "layers.0.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}]}
sft_ckpt/5000/model_params/d/c9caf11b5f29b8c2861e5ac1ef34bc04 ADDED
Binary file (2.73 kB). View file
 
sft_ckpt/5000/model_params/manifest.ocdbt ADDED
Binary file (117 Bytes). View file
 
sft_ckpt/5000/model_params/ocdbt.process_0/d/03006177174f19f3a92f0d5d97f8ed31 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1add560548ce632c7f28cf32104fa48576288a3695deddec81d89e5243fa2767
3
+ size 23289856
sft_ckpt/5000/model_params/ocdbt.process_0/d/4e56edcead7ffd2d8b23bbb874557dbb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03b6de97057df082db2428282da45fc206725228bef7312fd4b3153cbafaae1c
3
+ size 11644928
sft_ckpt/5000/model_params/ocdbt.process_0/d/51e04d30e831472d47c1fa4b5f389d8f ADDED
Binary file (206 Bytes). View file
 
sft_ckpt/5000/model_params/ocdbt.process_0/d/6bf77ef2ee1f00ea5a87c9221dfcb748 ADDED
Binary file (464 Bytes). View file
 
sft_ckpt/5000/model_params/ocdbt.process_0/d/d3cf8776c3cb51991b5e69c6e25b9f3f ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3821f79c250ce901a2c15eacf5a94702ab4ae27f7b62839addca0783623b004e
3
+ size 75497472
sft_ckpt/5000/model_params/ocdbt.process_0/manifest.ocdbt ADDED
Binary file (322 Bytes). View file
 
sft_ckpt/final/_CHECKPOINT_METADATA ADDED
@@ -0,0 +1 @@
 
 
1
+ {"item_handlers": "orbax.checkpoint._src.handlers.standard_checkpoint_handler.StandardCheckpointHandler", "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1768234317846803583, "commit_timestamp_nsecs": 1768234318780793646, "custom_metadata": {}}
sft_ckpt/final/_METADATA ADDED
The diff for this file is too large to render. See raw diff
 
sft_ckpt/final/_sharding ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bGF5ZXJzLjAuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjAubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE0LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE1LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE2LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE3LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE4LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjE5LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEwLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjExLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEyLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjEzLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI0LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1Lm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjI1LmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIwLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIxLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIyLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC51cF9wcm9qLmtlcm5lbF9sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5kb3duX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLm1scC5nYXRlX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ua3ZfZWluc3VtLndfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ucV9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjIzLmF0dG4ucV9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjMubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjQubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjUubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjYubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjcubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjguYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjgubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5rdl9laW5zdW0ud19sb3JhX2EudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5rdl9laW5zdW0ud19sb3JhX2IudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5xX2VpbnN1bS53X2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkuYXR0bi5xX2VpbnN1bS53X2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmRvd25fcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9hLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLmdhdGVfcHJvai5rZXJuZWxfbG9yYV9iLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}","bGF5ZXJzLjkubWxwLnVwX3Byb2oua2VybmVsX2xvcmFfYi52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 1], \"axis_names\": [\"fsdp\", \"tp\"], \"axis_types\": [\"AxisType.Auto\", \"AxisType.Auto\"], \"partition_spec\": [\"tp\", \"fsdp\"], \"device_mesh\": {\"mesh\": [[{\"id\": 0}]]}}"}
sft_ckpt/final/array_metadatas/process_0 ADDED
@@ -0,0 +1 @@
 
 
1
+ {"array_metadatas": [{"array_metadata": {"param_name": "layers.0.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.0.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.1.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.2.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.3.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.4.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.5.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.6.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.7.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.8.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.9.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.10.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.11.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.12.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.13.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.14.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.15.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.16.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.17.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.18.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.19.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.20.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.21.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.22.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.23.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.24.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.kv_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.kv_einsum.w_lora_b.value", "write_shape": [64, 2, 4, 256], "chunk_shape": [64, 2, 4, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.q_einsum.w_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.attn.q_einsum.w_lora_b.value", "write_shape": [64, 8, 256], "chunk_shape": [64, 8, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.down_proj.kernel_lora_a.value", "write_shape": [9216, 64], "chunk_shape": [9216, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.down_proj.kernel_lora_b.value", "write_shape": [64, 2304], "chunk_shape": [64, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.gate_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.gate_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.up_proj.kernel_lora_a.value", "write_shape": [2304, 64], "chunk_shape": [2304, 64], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers.25.mlp.up_proj.kernel_lora_b.value", "write_shape": [64, 9216], "chunk_shape": [64, 9216], "ext_metadata": null}}]}
sft_ckpt/final/d/48deca6292cb97ba955456412dc30d00 ADDED
Binary file (2.85 kB). View file
 
sft_ckpt/final/manifest.ocdbt ADDED
Binary file (117 Bytes). View file
 
sft_ckpt/final/ocdbt.process_0/d/4a6d6fdddb293719dc805175d035be68 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90c111bcf3f2521835dc59cf77fa7e5ab26a57dc1224c43e143afe87f8195a57
3
+ size 6012928
sft_ckpt/final/ocdbt.process_0/d/86e0eb73f2e05e489be9db977b37c014 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bb66222d7c519cf46308191bddd2e7e7c0f01ccfe5e215bc09a6f04c4d30ceb
3
+ size 452463
sft_ckpt/final/ocdbt.process_0/d/9d9e4d3965b9c252af699486babacbc3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e054764458a7e05b1a8eb82e71ffc8a4c56c646d8eb904252bf5be56eb8f19f1
3
+ size 19869696
sft_ckpt/final/ocdbt.process_0/d/9f03e1d63be7a07069a44caa9a02a442 ADDED
Binary file (474 Bytes). View file
 
sft_ckpt/final/ocdbt.process_0/d/c05b0bf61423c90ccbfcd19c0ce8f33d ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5eb6316b69ff53d675f416a44fc1a443ddf452eec377d1bbd079216c9c39aec4
3
+ size 73633792