clockwork7 commited on
Commit
279317f
·
verified ·
1 Parent(s): 3c0a33f

Upload folder using huggingface_hub

Browse files
Files changed (49) hide show
  1. .gitattributes +2 -0
  2. checkpoint_699/_CHECKPOINT_METADATA +1 -0
  3. checkpoint_699/_METADATA +0 -0
  4. checkpoint_699/_sharding +1 -0
  5. checkpoint_699/array_metadatas/process_0 +1 -0
  6. checkpoint_699/config.json +30 -0
  7. checkpoint_699/d/67b79e4fe6de42df91d9d08953c075a2 +0 -0
  8. checkpoint_699/flax_model.msgpack +3 -0
  9. checkpoint_699/generation_config.json +6 -0
  10. checkpoint_699/manifest.ocdbt +0 -0
  11. checkpoint_699/ocdbt.process_0/d/0b40c133e9305812cc742f60d8a73010 +0 -0
  12. checkpoint_699/ocdbt.process_0/d/12a84b9891bdce7f46e339d70ad78e35 +0 -0
  13. checkpoint_699/ocdbt.process_0/d/27257186844697c506798cd6e8f4712d +0 -0
  14. checkpoint_699/ocdbt.process_0/d/344efdaaa2958060c8d0ed5fabd9bcd8 +3 -0
  15. checkpoint_699/ocdbt.process_0/d/3c843e166b3e122cc85abc7bc73f8ca8 +0 -0
  16. checkpoint_699/ocdbt.process_0/d/4104bb52016845f085d7921f84c21d44 +0 -0
  17. checkpoint_699/ocdbt.process_0/d/45a9f77615c7713cdf951285c64524af +0 -0
  18. checkpoint_699/ocdbt.process_0/d/4e6c5352b3d2690e14ada02bda8d1037 +0 -0
  19. checkpoint_699/ocdbt.process_0/d/5191648a34f198e3ea22153c72696b93 +0 -0
  20. checkpoint_699/ocdbt.process_0/d/547e1b94e62a7b55e5225de962e03b16 +0 -0
  21. checkpoint_699/ocdbt.process_0/d/591c649b2e8d5670a811253b19a9c69e +0 -0
  22. checkpoint_699/ocdbt.process_0/d/5fadb0ed8cb6769d5123f852c5d05347 +0 -0
  23. checkpoint_699/ocdbt.process_0/d/6555211bf5279b8bdf4122ff8077aa4d +0 -0
  24. checkpoint_699/ocdbt.process_0/d/66352f50d3244947724f80c4639547ab +0 -0
  25. checkpoint_699/ocdbt.process_0/d/6a05da5af6d4aaadc903363c07132161 +0 -0
  26. checkpoint_699/ocdbt.process_0/d/70c24c1e5e3f8cc706784876be0c3433 +0 -0
  27. checkpoint_699/ocdbt.process_0/d/77e9c5d9683b1df3273be5356706a413 +0 -0
  28. checkpoint_699/ocdbt.process_0/d/8419f3a30b4e21dc95624fc60c6916fd +0 -0
  29. checkpoint_699/ocdbt.process_0/d/8b225223672fc8b9b15a05c1ff22b74b +0 -0
  30. checkpoint_699/ocdbt.process_0/d/91ab0ce968af08a2ee6f52e6ad98c6e5 +3 -0
  31. checkpoint_699/ocdbt.process_0/d/91f361b086f378ad2c6123141f66556d +0 -0
  32. checkpoint_699/ocdbt.process_0/d/9911b0d501475ff605147cef11006a03 +0 -0
  33. checkpoint_699/ocdbt.process_0/d/9cadda087dea1c5d5b67be9d039bff49 +0 -0
  34. checkpoint_699/ocdbt.process_0/d/a2e9005c23bf8a4f418460bded2cabb4 +0 -0
  35. checkpoint_699/ocdbt.process_0/d/a4401d680a0686aafaad9a76ce11c54d +0 -0
  36. checkpoint_699/ocdbt.process_0/d/a44d962c52cdeaa1c19d6b8a205bf3aa +0 -0
  37. checkpoint_699/ocdbt.process_0/d/ac144fd63f453f7b7df71a0721d82ab7 +0 -0
  38. checkpoint_699/ocdbt.process_0/d/b00873e82df5877a979db1f44e6330f4 +0 -0
  39. checkpoint_699/ocdbt.process_0/d/ba273621627b4079fa41a94a4ba5f6f6 +0 -0
  40. checkpoint_699/ocdbt.process_0/d/bc2a08547865130a383e508235349b7f +0 -0
  41. checkpoint_699/ocdbt.process_0/d/c1fbdc67d9d2df8e978a49eb6fe63261 +0 -0
  42. checkpoint_699/ocdbt.process_0/d/cfd40bf4cc2e4c47e7cec089a8d2c65c +0 -0
  43. checkpoint_699/ocdbt.process_0/d/da7a968977d95d0c46a56873e52e3e05 +0 -0
  44. checkpoint_699/ocdbt.process_0/d/e5cb30c7f58f0a13efb550c310dd4b0f +0 -0
  45. checkpoint_699/ocdbt.process_0/d/efae6cf5b45a30312b6bfa9447b1d8eb +0 -0
  46. checkpoint_699/ocdbt.process_0/d/f2805f2712de39a8d2d6095c9d0a8da0 +0 -0
  47. checkpoint_699/ocdbt.process_0/d/faea7553e0ae9a161834568ad2a5b6c3 +0 -0
  48. checkpoint_699/ocdbt.process_0/d/ffc5d50bd91e5fc49fd0377f70d1a94e +0 -0
  49. checkpoint_699/ocdbt.process_0/manifest.ocdbt +0 -0
.gitattributes CHANGED
@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ checkpoint_699/ocdbt.process_0/d/344efdaaa2958060c8d0ed5fabd9bcd8 filter=lfs diff=lfs merge=lfs -text
37
+ checkpoint_699/ocdbt.process_0/d/91ab0ce968af08a2ee6f52e6ad98c6e5 filter=lfs diff=lfs merge=lfs -text
checkpoint_699/_CHECKPOINT_METADATA ADDED
@@ -0,0 +1 @@
 
 
1
+ {"item_handlers": "orbax.checkpoint._src.handlers.pytree_checkpoint_handler.PyTreeCheckpointHandler", "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1743834704876500485, "commit_timestamp_nsecs": 1743834705379966406, "custom_metadata": {}}
checkpoint_699/_METADATA ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint_699/_sharding ADDED
@@ -0,0 +1 @@
 
 
1
+ {"ZHJvcG91dF9ybmc=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAuY291bnQ=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC40Lm1scC5jX2ZjLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC40Lm1scC5jX2ZjLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC40Lm1scC5jX3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC40Lm1scC5jX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC40LmF0dG4uY19hdHRuLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC40LmF0dG4uY19hdHRuLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC40LmF0dG4uY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC40LmF0dG4uY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC40LmxuXzEuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC40LmxuXzEuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC40LmxuXzIuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC40LmxuXzIuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC41Lm1scC5jX2ZjLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC41Lm1scC5jX2ZjLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC41Lm1scC5jX3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC41Lm1scC5jX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC41LmF0dG4uY19hdHRuLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC41LmF0dG4uY19hdHRuLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC41LmF0dG4uY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC41LmF0dG4uY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC41LmxuXzEuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC41LmxuXzEuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC41LmxuXzIuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC41LmxuXzIuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4wLm1scC5jX2ZjLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4wLm1scC5jX2ZjLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4wLm1scC5jX3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4wLm1scC5jX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4wLmF0dG4uY19hdHRuLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4wLmF0dG4uY19hdHRuLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4wLmF0dG4uY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4wLmF0dG4uY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4wLmxuXzEuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4wLmxuXzEuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4wLmxuXzIuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4wLmxuXzIuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4xLm1scC5jX2ZjLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4xLm1scC5jX2ZjLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4xLm1scC5jX3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4xLm1scC5jX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4xLmF0dG4uY19hdHRuLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4xLmF0dG4uY19hdHRuLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4xLmF0dG4uY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4xLmF0dG4uY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4xLmxuXzEuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4xLmxuXzEuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4xLmxuXzIuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4xLmxuXzIuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4yLm1scC5jX2ZjLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4yLm1scC5jX2ZjLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4yLm1scC5jX3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4yLm1scC5jX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4yLmF0dG4uY19hdHRuLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4yLmF0dG4uY19hdHRuLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4yLmF0dG4uY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4yLmF0dG4uY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4yLmxuXzEuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4yLmxuXzEuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4yLmxuXzIuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4yLmxuXzIuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4zLm1scC5jX2ZjLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4zLm1scC5jX2ZjLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4zLm1scC5jX3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4zLm1scC5jX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4zLmF0dG4uY19hdHRuLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4zLmF0dG4uY19hdHRuLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4zLmF0dG4uY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4zLmF0dG4uY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4zLmxuXzEuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4zLmxuXzEuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4zLmxuXzIuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIuaC4zLmxuXzIuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIubG5fZi5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIubG5fZi5zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIud3BlLmVtYmVkZGluZw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubXUudHJhbnNmb3JtZXIud3RlLmVtYmVkZGluZw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC40Lm1scC5jX2ZjLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC40Lm1scC5jX2ZjLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC40Lm1scC5jX3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC40Lm1scC5jX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC40LmF0dG4uY19hdHRuLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC40LmF0dG4uY19hdHRuLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC40LmF0dG4uY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC40LmF0dG4uY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC40LmxuXzEuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC40LmxuXzEuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC40LmxuXzIuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC40LmxuXzIuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC41Lm1scC5jX2ZjLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC41Lm1scC5jX2ZjLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC41Lm1scC5jX3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC41Lm1scC5jX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC41LmF0dG4uY19hdHRuLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC41LmF0dG4uY19hdHRuLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC41LmF0dG4uY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC41LmF0dG4uY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC41LmxuXzEuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC41LmxuXzEuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC41LmxuXzIuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC41LmxuXzIuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4wLm1scC5jX2ZjLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4wLm1scC5jX2ZjLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4wLm1scC5jX3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4wLm1scC5jX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4wLmF0dG4uY19hdHRuLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4wLmF0dG4uY19hdHRuLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4wLmF0dG4uY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4wLmF0dG4uY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4wLmxuXzEuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4wLmxuXzEuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4wLmxuXzIuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4wLmxuXzIuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4xLm1scC5jX2ZjLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4xLm1scC5jX2ZjLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4xLm1scC5jX3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4xLm1scC5jX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4xLmF0dG4uY19hdHRuLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4xLmF0dG4uY19hdHRuLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4xLmF0dG4uY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4xLmF0dG4uY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4xLmxuXzEuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4xLmxuXzEuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4xLmxuXzIuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4xLmxuXzIuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4yLm1scC5jX2ZjLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4yLm1scC5jX2ZjLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4yLm1scC5jX3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4yLm1scC5jX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4yLmF0dG4uY19hdHRuLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4yLmF0dG4uY19hdHRuLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4yLmF0dG4uY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4yLmF0dG4uY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4yLmxuXzEuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4yLmxuXzEuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4yLmxuXzIuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4yLmxuXzIuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4zLm1scC5jX2ZjLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4zLm1scC5jX2ZjLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4zLm1scC5jX3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4zLm1scC5jX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4zLmF0dG4uY19hdHRuLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4zLmF0dG4uY19hdHRuLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4zLmF0dG4uY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4zLmF0dG4uY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4zLmxuXzEuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4zLmxuXzEuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4zLmxuXzIuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIuaC4zLmxuXzIuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIubG5fZi5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIubG5fZi5zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIud3BlLmVtYmVkZGluZw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjAubnUudHJhbnNmb3JtZXIud3RlLmVtYmVkZGluZw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","b3B0X3N0YXRlLjIuY291bnQ=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","c3RlcA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMC5hdHRuLmNfYXR0bi5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMC5hdHRuLmNfYXR0bi5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMC5hdHRuLmNfcHJvai5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMC5hdHRuLmNfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMC5sbl8xLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMC5sbl8xLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMC5sbl8yLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMC5sbl8yLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMC5tbHAuY19mYy5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMC5tbHAuY19mYy5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMC5tbHAuY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMC5tbHAuY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMS5hdHRuLmNfYXR0bi5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMS5hdHRuLmNfYXR0bi5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMS5hdHRuLmNfcHJvai5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMS5hdHRuLmNfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMS5sbl8xLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMS5sbl8xLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMS5sbl8yLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMS5sbl8yLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMS5tbHAuY19mYy5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMS5tbHAuY19mYy5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMS5tbHAuY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMS5tbHAuY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMi5hdHRuLmNfYXR0bi5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMi5hdHRuLmNfYXR0bi5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMi5hdHRuLmNfcHJvai5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMi5hdHRuLmNfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMi5sbl8xLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMi5sbl8xLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMi5sbl8yLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMi5sbl8yLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMi5tbHAuY19mYy5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMi5tbHAuY19mYy5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMi5tbHAuY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMi5tbHAuY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMy5hdHRuLmNfYXR0bi5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMy5hdHRuLmNfYXR0bi5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMy5hdHRuLmNfcHJvai5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMy5hdHRuLmNfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMy5sbl8xLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMy5sbl8xLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMy5sbl8yLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMy5sbl8yLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMy5tbHAuY19mYy5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMy5tbHAuY19mYy5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMy5tbHAuY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguMy5tbHAuY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNC5hdHRuLmNfYXR0bi5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNC5hdHRuLmNfYXR0bi5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNC5hdHRuLmNfcHJvai5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNC5hdHRuLmNfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNC5sbl8xLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNC5sbl8xLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNC5sbl8yLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNC5sbl8yLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNC5tbHAuY19mYy5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNC5tbHAuY19mYy5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNC5tbHAuY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNC5tbHAuY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNS5hdHRuLmNfYXR0bi5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNS5hdHRuLmNfYXR0bi5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNS5hdHRuLmNfcHJvai5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNS5hdHRuLmNfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNS5sbl8xLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNS5sbl8xLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNS5sbl8yLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNS5sbl8yLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNS5tbHAuY19mYy5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNS5tbHAuY19mYy5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNS5tbHAuY19wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmguNS5tbHAuY19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmxuX2YuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLmxuX2Yuc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLnd0ZS5lbWJlZGRpbmc=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}","cGFyYW1zLnRyYW5zZm9ybWVyLndwZS5lbWJlZGRpbmc=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"cuda:0\"}"}
checkpoint_699/array_metadatas/process_0 ADDED
@@ -0,0 +1 @@
 
 
1
+ {"array_metadatas": [{"array_metadata": {"param_name": "step", "write_shape": [], "chunk_shape": [], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.0.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.0.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.0.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.0.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.0.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.0.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.0.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.0.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.0.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.0.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.0.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.0.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.1.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.1.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.1.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.1.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.1.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.1.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.1.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.1.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.1.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.1.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.1.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.1.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.2.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.2.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.2.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.2.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.2.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.2.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.2.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.2.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.2.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.2.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.2.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.2.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.3.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.3.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.3.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.3.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.3.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.3.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.3.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.3.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.3.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.3.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.3.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.3.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.4.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.4.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.4.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.4.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.4.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.4.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.4.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.4.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.4.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.4.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.4.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.4.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.5.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.5.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.5.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.5.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.5.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.5.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.5.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.5.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.5.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.5.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.5.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.h.5.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.ln_f.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.ln_f.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.wpe.embedding", "write_shape": [30, 512], "chunk_shape": [30, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "params.transformer.wte.embedding", "write_shape": [19, 512], "chunk_shape": [19, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.count", "write_shape": [], "chunk_shape": [], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.0.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.0.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.0.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.0.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.0.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.0.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.0.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.0.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.0.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.0.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.0.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.0.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.1.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.1.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.1.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.1.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.1.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.1.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.1.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.1.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.1.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.1.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.1.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.1.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.2.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.2.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.2.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.2.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.2.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.2.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.2.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.2.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.2.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.2.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.2.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.2.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.3.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.3.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.3.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.3.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.3.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.3.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.3.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.3.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.3.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.3.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.3.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.3.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.4.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.4.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.4.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.4.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.4.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.4.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.4.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.4.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.4.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.4.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.4.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.4.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.5.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.5.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.5.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.5.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.5.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.5.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.5.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.5.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.5.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.5.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.5.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.h.5.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.ln_f.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.ln_f.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.wpe.embedding", "write_shape": [30, 512], "chunk_shape": [30, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.mu.transformer.wte.embedding", "write_shape": [19, 512], "chunk_shape": [19, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.0.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.0.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.0.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.0.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.0.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.0.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.0.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.0.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.0.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.0.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.0.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.0.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.1.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.1.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.1.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.1.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.1.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.1.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.1.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.1.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.1.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.1.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.1.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.1.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.2.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.2.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.2.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.2.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.2.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.2.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.2.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.2.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.2.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.2.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.2.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.2.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.3.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.3.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.3.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.3.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.3.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.3.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.3.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.3.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.3.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.3.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.3.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.3.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.4.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.4.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.4.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.4.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.4.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.4.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.4.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.4.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.4.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.4.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.4.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.4.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.5.attn.c_attn.bias", "write_shape": [1536], "chunk_shape": [1536], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.5.attn.c_attn.kernel", "write_shape": [1536, 512], "chunk_shape": [1536, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.5.attn.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.5.attn.c_proj.kernel", "write_shape": [512, 512], "chunk_shape": [512, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.5.ln_1.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.5.ln_1.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.5.ln_2.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.5.ln_2.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.5.mlp.c_fc.bias", "write_shape": [2048], "chunk_shape": [2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.5.mlp.c_fc.kernel", "write_shape": [2048, 512], "chunk_shape": [2048, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.5.mlp.c_proj.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.h.5.mlp.c_proj.kernel", "write_shape": [512, 2048], "chunk_shape": [512, 2048], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.ln_f.bias", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.ln_f.scale", "write_shape": [512], "chunk_shape": [512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.wpe.embedding", "write_shape": [30, 512], "chunk_shape": [30, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.0.nu.transformer.wte.embedding", "write_shape": [19, 512], "chunk_shape": [19, 512], "ext_metadata": null}}, {"array_metadata": {"param_name": "opt_state.2.count", "write_shape": [], "chunk_shape": [], "ext_metadata": null}}, {"array_metadata": {"param_name": "dropout_rng", "write_shape": [4, 2], "chunk_shape": [4, 2], "ext_metadata": null}}]}
checkpoint_699/config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_function": "gelu_new",
3
+ "architectures": [
4
+ "GPT2LMHeadModel"
5
+ ],
6
+ "attn_pdrop": 0.1,
7
+ "bos_token_id": 50256,
8
+ "embd_pdrop": 0.1,
9
+ "eos_token_id": 50256,
10
+ "initializer_range": 0.02,
11
+ "layer_norm_epsilon": 1e-05,
12
+ "model_type": "gpt2",
13
+ "n_embd": 512,
14
+ "n_head": 8,
15
+ "n_inner": 2048,
16
+ "n_layer": 6,
17
+ "n_positions": 30,
18
+ "reorder_and_upcast_attn": false,
19
+ "resid_pdrop": 0.1,
20
+ "scale_attn_by_inverse_layer_idx": false,
21
+ "scale_attn_weights": true,
22
+ "summary_activation": null,
23
+ "summary_first_dropout": 0.1,
24
+ "summary_proj_to_labels": true,
25
+ "summary_type": "cls_index",
26
+ "summary_use_proj": true,
27
+ "transformers_version": "4.50.3",
28
+ "use_cache": true,
29
+ "vocab_size": 19
30
+ }
checkpoint_699/d/67b79e4fe6de42df91d9d08953c075a2 ADDED
Binary file (2.54 kB). View file
 
checkpoint_699/flax_model.msgpack ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:586cf7a0f4c6e9b13ab32472c2dfe2a8897e07f41d69782dd2290982543b28b6
3
+ size 75764174
checkpoint_699/generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 50256,
4
+ "eos_token_id": 50256,
5
+ "transformers_version": "4.50.3"
6
+ }
checkpoint_699/manifest.ocdbt ADDED
Binary file (117 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/0b40c133e9305812cc742f60d8a73010 ADDED
Binary file (422 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/12a84b9891bdce7f46e339d70ad78e35 ADDED
Binary file (425 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/27257186844697c506798cd6e8f4712d ADDED
Binary file (576 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/344efdaaa2958060c8d0ed5fabd9bcd8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23e319d711406b34d97462ed5b8daeba236bbda365e7854d8217a19c9961f7a1
3
+ size 23838742
checkpoint_699/ocdbt.process_0/d/3c843e166b3e122cc85abc7bc73f8ca8 ADDED
Binary file (529 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/4104bb52016845f085d7921f84c21d44 ADDED
Binary file (428 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/45a9f77615c7713cdf951285c64524af ADDED
Binary file (675 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/4e6c5352b3d2690e14ada02bda8d1037 ADDED
Binary file (606 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/5191648a34f198e3ea22153c72696b93 ADDED
Binary file (677 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/547e1b94e62a7b55e5225de962e03b16 ADDED
Binary file (427 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/591c649b2e8d5670a811253b19a9c69e ADDED
Binary file (573 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/5fadb0ed8cb6769d5123f852c5d05347 ADDED
Binary file (443 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/6555211bf5279b8bdf4122ff8077aa4d ADDED
Binary file (1.39 kB). View file
 
checkpoint_699/ocdbt.process_0/d/66352f50d3244947724f80c4639547ab ADDED
Binary file (37.4 kB). View file
 
checkpoint_699/ocdbt.process_0/d/6a05da5af6d4aaadc903363c07132161 ADDED
Binary file (575 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/70c24c1e5e3f8cc706784876be0c3433 ADDED
Binary file (1.28 kB). View file
 
checkpoint_699/ocdbt.process_0/d/77e9c5d9683b1df3273be5356706a413 ADDED
Binary file (655 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/8419f3a30b4e21dc95624fc60c6916fd ADDED
Binary file (433 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/8b225223672fc8b9b15a05c1ff22b74b ADDED
Binary file (424 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/91ab0ce968af08a2ee6f52e6ad98c6e5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f8dd32d755fabaaddf75cf7c8200a7663a31ac1a342f27ff668b704c128bafe
3
+ size 184382678
checkpoint_699/ocdbt.process_0/d/91f361b086f378ad2c6123141f66556d ADDED
Binary file (599 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/9911b0d501475ff605147cef11006a03 ADDED
Binary file (622 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/9cadda087dea1c5d5b67be9d039bff49 ADDED
Binary file (572 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/a2e9005c23bf8a4f418460bded2cabb4 ADDED
Binary file (596 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/a4401d680a0686aafaad9a76ce11c54d ADDED
Binary file (657 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/a44d962c52cdeaa1c19d6b8a205bf3aa ADDED
Binary file (413 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/ac144fd63f453f7b7df71a0721d82ab7 ADDED
Binary file (659 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/b00873e82df5877a979db1f44e6330f4 ADDED
Binary file (613 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/ba273621627b4079fa41a94a4ba5f6f6 ADDED
Binary file (653 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/bc2a08547865130a383e508235349b7f ADDED
Binary file (425 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/c1fbdc67d9d2df8e978a49eb6fe63261 ADDED
Binary file (578 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/cfd40bf4cc2e4c47e7cec089a8d2c65c ADDED
Binary file (578 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/da7a968977d95d0c46a56873e52e3e05 ADDED
Binary file (171 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/e5cb30c7f58f0a13efb550c310dd4b0f ADDED
Binary file (424 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/efae6cf5b45a30312b6bfa9447b1d8eb ADDED
Binary file (419 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/f2805f2712de39a8d2d6095c9d0a8da0 ADDED
Binary file (636 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/faea7553e0ae9a161834568ad2a5b6c3 ADDED
Binary file (571 Bytes). View file
 
checkpoint_699/ocdbt.process_0/d/ffc5d50bd91e5fc49fd0377f70d1a94e ADDED
Binary file (638 Bytes). View file
 
checkpoint_699/ocdbt.process_0/manifest.ocdbt ADDED
Binary file (371 Bytes). View file