Upload folder using huggingface_hub
Browse files- .gitattributes +3 -0
- README.md +19 -3
- checkpoints/best_3/_CHECKPOINT_METADATA +1 -0
- checkpoints/best_3/_METADATA +0 -0
- checkpoints/best_3/_sharding +1 -0
- checkpoints/best_3/array_metadatas/process_0 +1 -0
- checkpoints/best_3/d/d3999bfe67b6938c1d92978857dcd7d7 +0 -0
- checkpoints/best_3/manifest.ocdbt +0 -0
- checkpoints/best_3/ocdbt.process_0/d/12555194630aea1da36c360692d1c4c5 +0 -0
- checkpoints/best_3/ocdbt.process_0/d/2c524767bb010c8821efa98be1a98f41 +0 -0
- checkpoints/best_3/ocdbt.process_0/d/44ce11d5e07f9723cbe43bc2a1629291 +0 -0
- checkpoints/best_3/ocdbt.process_0/d/5efcb09927bf847895632c9d8fa8fdc3 +0 -0
- checkpoints/best_3/ocdbt.process_0/d/6892b4c2675051d496d152389bea4b4e +0 -0
- checkpoints/best_3/ocdbt.process_0/d/6ccb0ffef8c236498ffb8a1e4e498ed2 +3 -0
- checkpoints/best_3/ocdbt.process_0/d/a3fea488f1f0ffe3e25e7bceb4bc56dc +0 -0
- checkpoints/best_3/ocdbt.process_0/d/bb55d9a458b396ebd67ced981b9a5b98 +3 -0
- checkpoints/best_3/ocdbt.process_0/d/f8354f21218e18ee6fdd6383739e5045 +3 -0
- checkpoints/best_3/ocdbt.process_0/manifest.ocdbt +0 -0
- config.json +16 -0
- model.safetensors +3 -0
- tokenizer.json +0 -0
- tokenizer_config.json +6 -0
- training_history.csv +4 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
checkpoints/best_3/ocdbt.process_0/d/6ccb0ffef8c236498ffb8a1e4e498ed2 filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
checkpoints/best_3/ocdbt.process_0/d/bb55d9a458b396ebd67ced981b9a5b98 filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
checkpoints/best_3/ocdbt.process_0/d/f8354f21218e18ee6fdd6383739e5045 filter=lfs diff=lfs merge=lfs -text
|
README.md
CHANGED
|
@@ -1,3 +1,19 @@
|
|
| 1 |
-
|
| 2 |
-
|
| 3 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# SAM1 Hybrid Model
|
| 2 |
+
|
| 3 |
+
## Architecture
|
| 4 |
+
- Transformer + CNN + RNN
|
| 5 |
+
- Parameters: 253,748,736 (~253.7M)
|
| 6 |
+
- 24L × 768d × 12H
|
| 7 |
+
|
| 8 |
+
## Usage
|
| 9 |
+
```python
|
| 10 |
+
from transformers import AutoTokenizer, AutoModelForCausalLM
|
| 11 |
+
|
| 12 |
+
tokenizer = AutoTokenizer.from_pretrained("path/to/model")
|
| 13 |
+
model = AutoModelForCausalLM.from_pretrained("path/to/model")
|
| 14 |
+
|
| 15 |
+
prompt = "User: Hello!\nSam:"
|
| 16 |
+
inputs = tokenizer(prompt, return_tensors="pt")
|
| 17 |
+
outputs = model.generate(**inputs, max_length=100)
|
| 18 |
+
print(tokenizer.decode(outputs[0]))
|
| 19 |
+
```
|
checkpoints/best_3/_CHECKPOINT_METADATA
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"item_handlers": "orbax.checkpoint._src.handlers.pytree_checkpoint_handler.PyTreeCheckpointHandler", "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1762584927751970288, "commit_timestamp_nsecs": 1762584937500587047, "custom_metadata": {}}
|
checkpoints/best_3/_METADATA
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
checkpoints/best_3/_sharding
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"ZW1iZWRfdG9rZW5zLmVtYmVkZGluZw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bG1faGVhZC5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuY25uX25vcm0uc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYXR0bi52X3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYXR0bi5rX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYXR0bi5vX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYXR0bi5xX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYXR0bl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYmlkaXJlY3Rpb25hbF9ybm4uYmFja3dhcmRfY2VsbC5NaW5HUlVDZWxsXzAuY2FuZGlkYXRlLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYmlkaXJlY3Rpb25hbF9ybm4uYmFja3dhcmRfY2VsbC5NaW5HUlVDZWxsXzAuY2FuZGlkYXRlLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYmlkaXJlY3Rpb25hbF9ybm4uYmFja3dhcmRfY2VsbC5NaW5HUlVDZWxsXzAuZ2F0ZS5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYmlkaXJlY3Rpb25hbF9ybm4uYmFja3dhcmRfY2VsbC5NaW5HUlVDZWxsXzAuZ2F0ZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYmlkaXJlY3Rpb25hbF9ybm4uZm9yd2FyZF9jZWxsLk1pbkdSVUNlbGxfMC5jYW5kaWRhdGUuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYmlkaXJlY3Rpb25hbF9ybm4uZm9yd2FyZF9jZWxsLk1pbkdSVUNlbGxfMC5jYW5kaWRhdGUua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYmlkaXJlY3Rpb25hbF9ybm4uZm9yd2FyZF9jZWxsLk1pbkdSVUNlbGxfMC5nYXRlLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYmlkaXJlY3Rpb25hbF9ybm4uZm9yd2FyZF9jZWxsLk1pbkdSVUNlbGxfMC5nYXRlLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYmlkaXJlY3Rpb25hbF9ybm4uaW5wdXRfcHJvai5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYmlkaXJlY3Rpb25hbF9ybm4uaW5wdXRfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYmlkaXJlY3Rpb25hbF9ybm4ub3V0cHV0X3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYmlkaXJlY3Rpb25hbF9ybm4ub3V0cHV0X3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuYmlkaXJlY3Rpb25hbF9ybm4ubGF5ZXJfc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuZmZuLmRvd25fcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuZmZuLmdhdGVfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuZmZuLnVwX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAuZmZuX25vcm0uc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAubG9jYWxfY25uLmNvbnY1LmRlcHRod2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAubG9jYWxfY25uLmNvbnY1LnBvaW50d2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAubG9jYWxfY25uLmNvbnY3LmRlcHRod2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAubG9jYWxfY25uLmNvbnY3LnBvaW50d2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAubG9jYWxfY25uLmNvbnYzLmRlcHRod2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAubG9jYWxfY25uLmNvbnYzLnBvaW50d2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAubG9jYWxfY25uLmZ1c2lvbl9nYXRlLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAubG9jYWxfY25uLmZ1c2lvbl9nYXRlLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAubG9jYWxfY25uLmxheWVyX3NjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzAucm5uX25vcm0uc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE0LmF0dG4ua19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE0LmF0dG4ub19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE0LmF0dG4ucV9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE0LmF0dG4udl9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE0LmF0dG5fbm9ybS5zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE0LmZmbi51cF9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE0LmZmbi5kb3duX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE0LmZmbi5nYXRlX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE0LmZmbl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmF0dG4ua19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmF0dG4ub19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmF0dG4ucV9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmF0dG4udl9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmF0dG5fbm9ybS5zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmNubl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmZmbi51cF9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmZmbi5kb3duX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmZmbi5nYXRlX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmZmbl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmxvY2FsX2Nubi5jb252My5kZXB0aHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmxvY2FsX2Nubi5jb252My5wb2ludHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmxvY2FsX2Nubi5jb252NS5kZXB0aHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmxvY2FsX2Nubi5jb252NS5wb2ludHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmxvY2FsX2Nubi5jb252Ny5kZXB0aHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmxvY2FsX2Nubi5jb252Ny5wb2ludHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmxvY2FsX2Nubi5mdXNpb25fZ2F0ZS5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmxvY2FsX2Nubi5mdXNpb25fZ2F0ZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE1LmxvY2FsX2Nubi5sYXllcl9zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmF0dG4ua19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmF0dG4ub19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmF0dG4ucV9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmF0dG4udl9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmF0dG5fbm9ybS5zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmJpZGlyZWN0aW9uYWxfcm5uLm91dHB1dF9wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmJpZGlyZWN0aW9uYWxfcm5uLm91dHB1dF9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmJpZGlyZWN0aW9uYWxfcm5uLmJhY2t3YXJkX2NlbGwuTWluR1JVQ2VsbF8wLmNhbmRpZGF0ZS5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmJpZGlyZWN0aW9uYWxfcm5uLmJhY2t3YXJkX2NlbGwuTWluR1JVQ2VsbF8wLmNhbmRpZGF0ZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmJpZGlyZWN0aW9uYWxfcm5uLmJhY2t3YXJkX2NlbGwuTWluR1JVQ2VsbF8wLmdhdGUuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmJpZGlyZWN0aW9uYWxfcm5uLmJhY2t3YXJkX2NlbGwuTWluR1JVQ2VsbF8wLmdhdGUua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmJpZGlyZWN0aW9uYWxfcm5uLmZvcndhcmRfY2VsbC5NaW5HUlVDZWxsXzAuY2FuZGlkYXRlLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmJpZGlyZWN0aW9uYWxfcm5uLmZvcndhcmRfY2VsbC5NaW5HUlVDZWxsXzAuY2FuZGlkYXRlLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmJpZGlyZWN0aW9uYWxfcm5uLmZvcndhcmRfY2VsbC5NaW5HUlVDZWxsXzAuZ2F0ZS5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmJpZGlyZWN0aW9uYWxfcm5uLmZvcndhcmRfY2VsbC5NaW5HUlVDZWxsXzAuZ2F0ZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmJpZGlyZWN0aW9uYWxfcm5uLmlucHV0X3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmJpZGlyZWN0aW9uYWxfcm5uLmlucHV0X3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmJpZGlyZWN0aW9uYWxfcm5uLmxheWVyX3NjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmZmbi51cF9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmZmbi5kb3duX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmZmbi5nYXRlX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LmZmbl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE2LnJubl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE3LmF0dG4ua19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE3LmF0dG4ub19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE3LmF0dG4ucV9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE3LmF0dG4udl9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE3LmF0dG5fbm9ybS5zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE3LmZmbi51cF9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE3LmZmbi5kb3duX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE3LmZmbi5nYXRlX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE3LmZmbl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmF0dG4ua19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmF0dG4ub19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmF0dG4ucV9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmF0dG4udl9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmF0dG5fbm9ybS5zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmNubl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmZmbi51cF9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmZmbi5kb3duX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmZmbi5nYXRlX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmZmbl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmxvY2FsX2Nubi5jb252My5kZXB0aHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmxvY2FsX2Nubi5jb252My5wb2ludHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmxvY2FsX2Nubi5jb252NS5kZXB0aHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmxvY2FsX2Nubi5jb252NS5wb2ludHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmxvY2FsX2Nubi5jb252Ny5kZXB0aHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmxvY2FsX2Nubi5jb252Ny5wb2ludHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmxvY2FsX2Nubi5mdXNpb25fZ2F0ZS5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmxvY2FsX2Nubi5mdXNpb25fZ2F0ZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE4LmxvY2FsX2Nubi5sYXllcl9zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE5LmF0dG4ua19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE5LmF0dG4ub19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE5LmF0dG4ucV9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE5LmF0dG4udl9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE5LmF0dG5fbm9ybS5zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE5LmZmbi51cF9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE5LmZmbi5kb3duX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE5LmZmbi5nYXRlX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzE5LmZmbl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEuYXR0bi52X3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEuYXR0bi5rX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEuYXR0bi5vX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEuYXR0bi5xX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEuYXR0bl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEuZmZuLmRvd25fcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEuZmZuLmdhdGVfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEuZmZuLnVwX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEuZmZuX25vcm0uc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEwLmF0dG4ua19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEwLmF0dG4ub19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEwLmF0dG4ucV9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEwLmF0dG4udl9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEwLmF0dG5fbm9ybS5zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEwLmZmbi51cF9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEwLmZmbi5kb3duX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEwLmZmbi5nYXRlX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEwLmZmbl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzExLmF0dG4ua19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzExLmF0dG4ub19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzExLmF0dG4ucV9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzExLmF0dG4udl9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzExLmF0dG5fbm9ybS5zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzExLmZmbi51cF9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzExLmZmbi5kb3duX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzExLmZmbi5nYXRlX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzExLmZmbl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmF0dG4ua19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmF0dG4ub19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmF0dG4ucV9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmF0dG4udl9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmF0dG5fbm9ybS5zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmJpZGlyZWN0aW9uYWxfcm5uLm91dHB1dF9wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmJpZGlyZWN0aW9uYWxfcm5uLm91dHB1dF9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmJpZGlyZWN0aW9uYWxfcm5uLmJhY2t3YXJkX2NlbGwuTWluR1JVQ2VsbF8wLmNhbmRpZGF0ZS5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmJpZGlyZWN0aW9uYWxfcm5uLmJhY2t3YXJkX2NlbGwuTWluR1JVQ2VsbF8wLmNhbmRpZGF0ZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmJpZGlyZWN0aW9uYWxfcm5uLmJhY2t3YXJkX2NlbGwuTWluR1JVQ2VsbF8wLmdhdGUuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmJpZGlyZWN0aW9uYWxfcm5uLmJhY2t3YXJkX2NlbGwuTWluR1JVQ2VsbF8wLmdhdGUua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmJpZGlyZWN0aW9uYWxfcm5uLmZvcndhcmRfY2VsbC5NaW5HUlVDZWxsXzAuY2FuZGlkYXRlLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmJpZGlyZWN0aW9uYWxfcm5uLmZvcndhcmRfY2VsbC5NaW5HUlVDZWxsXzAuY2FuZGlkYXRlLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmJpZGlyZWN0aW9uYWxfcm5uLmZvcndhcmRfY2VsbC5NaW5HUlVDZWxsXzAuZ2F0ZS5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmJpZGlyZWN0aW9uYWxfcm5uLmZvcndhcmRfY2VsbC5NaW5HUlVDZWxsXzAuZ2F0ZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmJpZGlyZWN0aW9uYWxfcm5uLmlucHV0X3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmJpZGlyZWN0aW9uYWxfcm5uLmlucHV0X3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmJpZGlyZWN0aW9uYWxfcm5uLmxheWVyX3NjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmNubl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmZmbi51cF9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmZmbi5kb3duX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmZmbi5nYXRlX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmZmbl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmxvY2FsX2Nubi5jb252My5kZXB0aHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmxvY2FsX2Nubi5jb252My5wb2ludHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmxvY2FsX2Nubi5jb252NS5kZXB0aHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmxvY2FsX2Nubi5jb252NS5wb2ludHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmxvY2FsX2Nubi5jb252Ny5kZXB0aHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmxvY2FsX2Nubi5jb252Ny5wb2ludHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmxvY2FsX2Nubi5mdXNpb25fZ2F0ZS5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmxvY2FsX2Nubi5mdXNpb25fZ2F0ZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLmxvY2FsX2Nubi5sYXllcl9zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEyLnJubl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEzLmF0dG4ua19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEzLmF0dG4ub19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEzLmF0dG4ucV9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEzLmF0dG4udl9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEzLmF0dG5fbm9ybS5zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEzLmZmbi51cF9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEzLmZmbi5kb3duX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEzLmZmbi5nYXRlX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzEzLmZmbl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIuYXR0bi52X3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIuYXR0bi5rX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIuYXR0bi5vX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIuYXR0bi5xX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIuYXR0bl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIuZmZuLmRvd25fcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIuZmZuLmdhdGVfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIuZmZuLnVwX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIuZmZuX25vcm0uc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmF0dG4ua19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmF0dG4ub19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmF0dG4ucV9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmF0dG4udl9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmF0dG5fbm9ybS5zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmJpZGlyZWN0aW9uYWxfcm5uLm91dHB1dF9wcm9qLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmJpZGlyZWN0aW9uYWxfcm5uLm91dHB1dF9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmJpZGlyZWN0aW9uYWxfcm5uLmJhY2t3YXJkX2NlbGwuTWluR1JVQ2VsbF8wLmNhbmRpZGF0ZS5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmJpZGlyZWN0aW9uYWxfcm5uLmJhY2t3YXJkX2NlbGwuTWluR1JVQ2VsbF8wLmNhbmRpZGF0ZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmJpZGlyZWN0aW9uYWxfcm5uLmJhY2t3YXJkX2NlbGwuTWluR1JVQ2VsbF8wLmdhdGUuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmJpZGlyZWN0aW9uYWxfcm5uLmJhY2t3YXJkX2NlbGwuTWluR1JVQ2VsbF8wLmdhdGUua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmJpZGlyZWN0aW9uYWxfcm5uLmZvcndhcmRfY2VsbC5NaW5HUlVDZWxsXzAuY2FuZGlkYXRlLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmJpZGlyZWN0aW9uYWxfcm5uLmZvcndhcmRfY2VsbC5NaW5HUlVDZWxsXzAuY2FuZGlkYXRlLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmJpZGlyZWN0aW9uYWxfcm5uLmZvcndhcmRfY2VsbC5NaW5HUlVDZWxsXzAuZ2F0ZS5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmJpZGlyZWN0aW9uYWxfcm5uLmZvcndhcmRfY2VsbC5NaW5HUlVDZWxsXzAuZ2F0ZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmJpZGlyZWN0aW9uYWxfcm5uLmlucHV0X3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmJpZGlyZWN0aW9uYWxfcm5uLmlucHV0X3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmJpZGlyZWN0aW9uYWxfcm5uLmxheWVyX3NjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmZmbi51cF9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmZmbi5kb3duX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmZmbi5nYXRlX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLmZmbl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIwLnJubl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmF0dG4ua19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmF0dG4ub19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmF0dG4ucV9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmF0dG4udl9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmF0dG5fbm9ybS5zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmNubl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmZmbi51cF9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmZmbi5kb3duX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmZmbi5nYXRlX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmZmbl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmxvY2FsX2Nubi5jb252My5kZXB0aHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmxvY2FsX2Nubi5jb252My5wb2ludHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmxvY2FsX2Nubi5jb252NS5kZXB0aHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmxvY2FsX2Nubi5jb252NS5wb2ludHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmxvY2FsX2Nubi5jb252Ny5kZXB0aHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmxvY2FsX2Nubi5jb252Ny5wb2ludHdpc2Uua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmxvY2FsX2Nubi5mdXNpb25fZ2F0ZS5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmxvY2FsX2Nubi5mdXNpb25fZ2F0ZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIxLmxvY2FsX2Nubi5sYXllcl9zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIyLmF0dG4ua19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIyLmF0dG4ub19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIyLmF0dG4ucV9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIyLmF0dG4udl9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIyLmF0dG5fbm9ybS5zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIyLmZmbi51cF9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIyLmZmbi5kb3duX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIyLmZmbi5nYXRlX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIyLmZmbl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIzLmF0dG4ua19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIzLmF0dG4ub19wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIzLmF0dG4ucV9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIzLmF0dG4udl9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIzLmF0dG5fbm9ybS5zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIzLmZmbi51cF9wcm9qLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIzLmZmbi5kb3duX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIzLmZmbi5nYXRlX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzIzLmZmbl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMuY25uX25vcm0uc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMuYXR0bi52X3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMuYXR0bi5rX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMuYXR0bi5vX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMuYXR0bi5xX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMuYXR0bl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMuZmZuLmRvd25fcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMuZmZuLmdhdGVfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMuZmZuLnVwX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMuZmZuX25vcm0uc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMubG9jYWxfY25uLmNvbnY1LmRlcHRod2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMubG9jYWxfY25uLmNvbnY1LnBvaW50d2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMubG9jYWxfY25uLmNvbnY3LmRlcHRod2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMubG9jYWxfY25uLmNvbnY3LnBvaW50d2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMubG9jYWxfY25uLmNvbnYzLmRlcHRod2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMubG9jYWxfY25uLmNvbnYzLnBvaW50d2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMubG9jYWxfY25uLmZ1c2lvbl9nYXRlLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMubG9jYWxfY25uLmZ1c2lvbl9nYXRlLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzMubG9jYWxfY25uLmxheWVyX3NjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYXR0bi52X3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYXR0bi5rX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYXR0bi5vX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYXR0bi5xX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYXR0bl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYmlkaXJlY3Rpb25hbF9ybm4uYmFja3dhcmRfY2VsbC5NaW5HUlVDZWxsXzAuY2FuZGlkYXRlLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYmlkaXJlY3Rpb25hbF9ybm4uYmFja3dhcmRfY2VsbC5NaW5HUlVDZWxsXzAuY2FuZGlkYXRlLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYmlkaXJlY3Rpb25hbF9ybm4uYmFja3dhcmRfY2VsbC5NaW5HUlVDZWxsXzAuZ2F0ZS5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYmlkaXJlY3Rpb25hbF9ybm4uYmFja3dhcmRfY2VsbC5NaW5HUlVDZWxsXzAuZ2F0ZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYmlkaXJlY3Rpb25hbF9ybm4uZm9yd2FyZF9jZWxsLk1pbkdSVUNlbGxfMC5jYW5kaWRhdGUuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYmlkaXJlY3Rpb25hbF9ybm4uZm9yd2FyZF9jZWxsLk1pbkdSVUNlbGxfMC5jYW5kaWRhdGUua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYmlkaXJlY3Rpb25hbF9ybm4uZm9yd2FyZF9jZWxsLk1pbkdSVUNlbGxfMC5nYXRlLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYmlkaXJlY3Rpb25hbF9ybm4uZm9yd2FyZF9jZWxsLk1pbkdSVUNlbGxfMC5nYXRlLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYmlkaXJlY3Rpb25hbF9ybm4uaW5wdXRfcHJvai5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYmlkaXJlY3Rpb25hbF9ybm4uaW5wdXRfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYmlkaXJlY3Rpb25hbF9ybm4ub3V0cHV0X3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYmlkaXJlY3Rpb25hbF9ybm4ub3V0cHV0X3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuYmlkaXJlY3Rpb25hbF9ybm4ubGF5ZXJfc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuZmZuLmRvd25fcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuZmZuLmdhdGVfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuZmZuLnVwX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQuZmZuX25vcm0uc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzQucm5uX25vcm0uc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzUuYXR0bi52X3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzUuYXR0bi5rX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzUuYXR0bi5vX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzUuYXR0bi5xX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzUuYXR0bl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzUuZmZuLmRvd25fcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzUuZmZuLmdhdGVfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzUuZmZuLnVwX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzUuZmZuX25vcm0uc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYuY25uX25vcm0uc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYuYXR0bi52X3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYuYXR0bi5rX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYuYXR0bi5vX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYuYXR0bi5xX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYuYXR0bl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYuZmZuLmRvd25fcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYuZmZuLmdhdGVfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYuZmZuLnVwX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYuZmZuX25vcm0uc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYubG9jYWxfY25uLmNvbnY1LmRlcHRod2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYubG9jYWxfY25uLmNvbnY1LnBvaW50d2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYubG9jYWxfY25uLmNvbnY3LmRlcHRod2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYubG9jYWxfY25uLmNvbnY3LnBvaW50d2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYubG9jYWxfY25uLmNvbnYzLmRlcHRod2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYubG9jYWxfY25uLmNvbnYzLnBvaW50d2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYubG9jYWxfY25uLmZ1c2lvbl9nYXRlLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYubG9jYWxfY25uLmZ1c2lvbl9nYXRlLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzYubG9jYWxfY25uLmxheWVyX3NjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzcuYXR0bi52X3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzcuYXR0bi5rX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzcuYXR0bi5vX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzcuYXR0bi5xX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzcuYXR0bl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzcuZmZuLmRvd25fcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzcuZmZuLmdhdGVfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzcuZmZuLnVwX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzcuZmZuX25vcm0uc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYXR0bi52X3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYXR0bi5rX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYXR0bi5vX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYXR0bi5xX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYXR0bl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYmlkaXJlY3Rpb25hbF9ybm4uYmFja3dhcmRfY2VsbC5NaW5HUlVDZWxsXzAuY2FuZGlkYXRlLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYmlkaXJlY3Rpb25hbF9ybm4uYmFja3dhcmRfY2VsbC5NaW5HUlVDZWxsXzAuY2FuZGlkYXRlLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYmlkaXJlY3Rpb25hbF9ybm4uYmFja3dhcmRfY2VsbC5NaW5HUlVDZWxsXzAuZ2F0ZS5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYmlkaXJlY3Rpb25hbF9ybm4uYmFja3dhcmRfY2VsbC5NaW5HUlVDZWxsXzAuZ2F0ZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYmlkaXJlY3Rpb25hbF9ybm4uZm9yd2FyZF9jZWxsLk1pbkdSVUNlbGxfMC5jYW5kaWRhdGUuYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYmlkaXJlY3Rpb25hbF9ybm4uZm9yd2FyZF9jZWxsLk1pbkdSVUNlbGxfMC5jYW5kaWRhdGUua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYmlkaXJlY3Rpb25hbF9ybm4uZm9yd2FyZF9jZWxsLk1pbkdSVUNlbGxfMC5nYXRlLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYmlkaXJlY3Rpb25hbF9ybm4uZm9yd2FyZF9jZWxsLk1pbkdSVUNlbGxfMC5nYXRlLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYmlkaXJlY3Rpb25hbF9ybm4uaW5wdXRfcHJvai5iaWFz":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYmlkaXJlY3Rpb25hbF9ybm4uaW5wdXRfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYmlkaXJlY3Rpb25hbF9ybm4ub3V0cHV0X3Byb2ouYmlhcw==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYmlkaXJlY3Rpb25hbF9ybm4ub3V0cHV0X3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguYmlkaXJlY3Rpb25hbF9ybm4ubGF5ZXJfc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguZmZuLmRvd25fcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguZmZuLmdhdGVfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguZmZuLnVwX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzguZmZuX25vcm0uc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzgucm5uX25vcm0uc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkuY25uX25vcm0uc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkuYXR0bi52X3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkuYXR0bi5rX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkuYXR0bi5vX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkuYXR0bi5xX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkuYXR0bl9ub3JtLnNjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkuZmZuLmRvd25fcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkuZmZuLmdhdGVfcHJvai5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkuZmZuLnVwX3Byb2oua2VybmVs":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkuZmZuX25vcm0uc2NhbGU=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkubG9jYWxfY25uLmNvbnY1LmRlcHRod2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkubG9jYWxfY25uLmNvbnY1LnBvaW50d2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkubG9jYWxfY25uLmNvbnY3LmRlcHRod2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkubG9jYWxfY25uLmNvbnY3LnBvaW50d2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkubG9jYWxfY25uLmNvbnYzLmRlcHRod2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkubG9jYWxfY25uLmNvbnYzLnBvaW50d2lzZS5rZXJuZWw=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkubG9jYWxfY25uLmZ1c2lvbl9nYXRlLmJpYXM=":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkubG9jYWxfY25uLmZ1c2lvbl9nYXRlLmtlcm5lbA==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bGF5ZXJzXzkubG9jYWxfY25uLmxheWVyX3NjYWxl":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}","bm9ybS5zY2FsZQ==":"{\"sharding_type\": \"SingleDeviceSharding\", \"device_str\": \"TPU_0(process=0,(0,0,0,0))\"}"}
|
checkpoints/best_3/array_metadatas/process_0
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"array_metadatas": [{"array_metadata": {"param_name": "embed_tokens.embedding", "write_shape": [50264, 768], "chunk_shape": [50264, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.input_proj.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.input_proj.kernel", "write_shape": [768, 384], "chunk_shape": [768, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.output_proj.bias", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.output_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.cnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.conv3.depthwise.kernel", "write_shape": [3, 1, 768], "chunk_shape": [3, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.conv3.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.conv5.depthwise.kernel", "write_shape": [5, 1, 768], "chunk_shape": [5, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.conv5.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.conv7.depthwise.kernel", "write_shape": [7, 1, 768], "chunk_shape": [7, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.conv7.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.fusion_gate.bias", "write_shape": [2304], "chunk_shape": [2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.fusion_gate.kernel", "write_shape": [768, 2304], "chunk_shape": [768, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.rnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.input_proj.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.input_proj.kernel", "write_shape": [768, 384], "chunk_shape": [768, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.output_proj.bias", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.output_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.cnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.conv3.depthwise.kernel", "write_shape": [3, 1, 768], "chunk_shape": [3, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.conv3.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.conv5.depthwise.kernel", "write_shape": [5, 1, 768], "chunk_shape": [5, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.conv5.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.conv7.depthwise.kernel", "write_shape": [7, 1, 768], "chunk_shape": [7, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.conv7.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.fusion_gate.bias", "write_shape": [2304], "chunk_shape": [2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.fusion_gate.kernel", "write_shape": [768, 2304], "chunk_shape": [768, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.rnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.cnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.conv3.depthwise.kernel", "write_shape": [3, 1, 768], "chunk_shape": [3, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.conv3.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.conv5.depthwise.kernel", "write_shape": [5, 1, 768], "chunk_shape": [5, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.conv5.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.conv7.depthwise.kernel", "write_shape": [7, 1, 768], "chunk_shape": [7, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.conv7.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.fusion_gate.bias", "write_shape": [2304], "chunk_shape": [2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.fusion_gate.kernel", "write_shape": [768, 2304], "chunk_shape": [768, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.input_proj.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.input_proj.kernel", "write_shape": [768, 384], "chunk_shape": [768, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.output_proj.bias", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.output_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.rnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.cnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.conv3.depthwise.kernel", "write_shape": [3, 1, 768], "chunk_shape": [3, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.conv3.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.conv5.depthwise.kernel", "write_shape": [5, 1, 768], "chunk_shape": [5, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.conv5.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.conv7.depthwise.kernel", "write_shape": [7, 1, 768], "chunk_shape": [7, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.conv7.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.fusion_gate.bias", "write_shape": [2304], "chunk_shape": [2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.fusion_gate.kernel", "write_shape": [768, 2304], "chunk_shape": [768, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.input_proj.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.input_proj.kernel", "write_shape": [768, 384], "chunk_shape": [768, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.output_proj.bias", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.output_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.rnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.cnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.conv3.depthwise.kernel", "write_shape": [3, 1, 768], "chunk_shape": [3, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.conv3.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.conv5.depthwise.kernel", "write_shape": [5, 1, 768], "chunk_shape": [5, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.conv5.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.conv7.depthwise.kernel", "write_shape": [7, 1, 768], "chunk_shape": [7, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.conv7.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.fusion_gate.bias", "write_shape": [2304], "chunk_shape": [2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.fusion_gate.kernel", "write_shape": [768, 2304], "chunk_shape": [768, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.cnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.conv3.depthwise.kernel", "write_shape": [3, 1, 768], "chunk_shape": [3, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.conv3.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.conv5.depthwise.kernel", "write_shape": [5, 1, 768], "chunk_shape": [5, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.conv5.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.conv7.depthwise.kernel", "write_shape": [7, 1, 768], "chunk_shape": [7, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.conv7.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.fusion_gate.bias", "write_shape": [2304], "chunk_shape": [2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.fusion_gate.kernel", "write_shape": [768, 2304], "chunk_shape": [768, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.input_proj.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.input_proj.kernel", "write_shape": [768, 384], "chunk_shape": [768, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.output_proj.bias", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.output_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.rnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.cnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.conv3.depthwise.kernel", "write_shape": [3, 1, 768], "chunk_shape": [3, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.conv3.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.conv5.depthwise.kernel", "write_shape": [5, 1, 768], "chunk_shape": [5, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.conv5.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.conv7.depthwise.kernel", "write_shape": [7, 1, 768], "chunk_shape": [7, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.conv7.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.fusion_gate.bias", "write_shape": [2304], "chunk_shape": [2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.fusion_gate.kernel", "write_shape": [768, 2304], "chunk_shape": [768, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.input_proj.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.input_proj.kernel", "write_shape": [768, 384], "chunk_shape": [768, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.output_proj.bias", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.output_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.rnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.cnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.conv3.depthwise.kernel", "write_shape": [3, 1, 768], "chunk_shape": [3, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.conv3.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.conv5.depthwise.kernel", "write_shape": [5, 1, 768], "chunk_shape": [5, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.conv5.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.conv7.depthwise.kernel", "write_shape": [7, 1, 768], "chunk_shape": [7, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.conv7.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.fusion_gate.bias", "write_shape": [2304], "chunk_shape": [2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.fusion_gate.kernel", "write_shape": [768, 2304], "chunk_shape": [768, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "lm_head.kernel", "write_shape": [768, 50264], "chunk_shape": [768, 50264], "ext_metadata": null}}, {"array_metadata": {"param_name": "norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}]}
|
checkpoints/best_3/d/d3999bfe67b6938c1d92978857dcd7d7
ADDED
|
Binary file (4.56 kB). View file
|
|
|
checkpoints/best_3/manifest.ocdbt
ADDED
|
Binary file (118 Bytes). View file
|
|
|
checkpoints/best_3/ocdbt.process_0/d/12555194630aea1da36c360692d1c4c5
ADDED
|
Binary file (1.2 kB). View file
|
|
|
checkpoints/best_3/ocdbt.process_0/d/2c524767bb010c8821efa98be1a98f41
ADDED
|
Binary file (1.41 kB). View file
|
|
|
checkpoints/best_3/ocdbt.process_0/d/44ce11d5e07f9723cbe43bc2a1629291
ADDED
|
Binary file (1.31 kB). View file
|
|
|
checkpoints/best_3/ocdbt.process_0/d/5efcb09927bf847895632c9d8fa8fdc3
ADDED
|
Binary file (197 Bytes). View file
|
|
|
checkpoints/best_3/ocdbt.process_0/d/6892b4c2675051d496d152389bea4b4e
ADDED
|
Binary file (14.2 kB). View file
|
|
|
checkpoints/best_3/ocdbt.process_0/d/6ccb0ffef8c236498ffb8a1e4e498ed2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ecff57681e7e45ffdee77a1c4e390df400372273d8ddc5fb5a7116123d011354
|
| 3 |
+
size 136159232
|
checkpoints/best_3/ocdbt.process_0/d/a3fea488f1f0ffe3e25e7bceb4bc56dc
ADDED
|
Binary file (951 Bytes). View file
|
|
|
checkpoints/best_3/ocdbt.process_0/d/bb55d9a458b396ebd67ced981b9a5b98
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a1ae05a8714fd55a707b35e7f50038fa7025aa13d98c38aea5ace632153b4e6e
|
| 3 |
+
size 43171840
|
checkpoints/best_3/ocdbt.process_0/d/f8354f21218e18ee6fdd6383739e5045
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a81bd0d163751586cd2e6d715948f2541d329adac2a58be285e5aec48fb4db62
|
| 3 |
+
size 753119232
|
checkpoints/best_3/ocdbt.process_0/manifest.ocdbt
ADDED
|
Binary file (467 Bytes). View file
|
|
|
config.json
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"model_type": "sam1_hybrid",
|
| 3 |
+
"vocab_size": 50264,
|
| 4 |
+
"d_model": 768,
|
| 5 |
+
"n_layers": 24,
|
| 6 |
+
"n_heads": 12,
|
| 7 |
+
"n_kv_heads": 2,
|
| 8 |
+
"ff_dim": 1920,
|
| 9 |
+
"max_len": 1024,
|
| 10 |
+
"use_cnn": true,
|
| 11 |
+
"use_rnn": true,
|
| 12 |
+
"rnn_hidden": 384,
|
| 13 |
+
"architectures": [
|
| 14 |
+
"SAM1HybridForCausalLM"
|
| 15 |
+
]
|
| 16 |
+
}
|
model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d49da73ae7aeb5a335f93023fdb50ed6cb7d8954fd6d4f1221e5f7affa0b354
|
| 3 |
+
size 1015036512
|
tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"tokenizer_class": "GPT2Tokenizer",
|
| 3 |
+
"chat_template": "User: {{input}}\nSam: {{output}}",
|
| 4 |
+
"eos_token": "<|endoftext|>",
|
| 5 |
+
"model_max_length": 1024
|
| 6 |
+
}
|
training_history.csv
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
train_loss,train_ce,train_z,train_acc,train_ppl,val_loss,val_ce,val_z,val_acc,val_ppl
|
| 2 |
+
0.9324811697006226,0.9301027059555054,0.0023784860968589783,0.9747710824012756,34.463226318359375,0.7455353140830994,0.7454673051834106,6.797964306315407e-05,0.9994805455207825,2.1074304580688477
|
| 3 |
+
0.7442176342010498,0.7441790103912354,3.8648839108645916e-05,0.9995428323745728,2.1047160625457764,0.7447968125343323,0.7447550296783447,4.179905590717681e-05,0.9995492100715637,2.1059272289276123
|
| 4 |
+
0.743730902671814,0.7437002062797546,3.068605292355642e-05,0.9995979070663452,2.1037073135375977,0.7445427179336548,0.7445056438446045,3.705303242895752e-05,0.9995689392089844,2.1054019927978516
|