Bc-AI's picture
Upload folder using huggingface_hub
80cee68 verified
{"array_metadatas": [{"array_metadata": {"param_name": "embed_tokens.embedding", "write_shape": [50264, 768], "chunk_shape": [50264, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.input_proj.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.input_proj.kernel", "write_shape": [768, 384], "chunk_shape": [768, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.output_proj.bias", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.bidirectional_rnn.output_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.cnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.conv3.depthwise.kernel", "write_shape": [3, 1, 768], "chunk_shape": [3, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.conv3.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.conv5.depthwise.kernel", "write_shape": [5, 1, 768], "chunk_shape": [5, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.conv5.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.conv7.depthwise.kernel", "write_shape": [7, 1, 768], "chunk_shape": [7, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.conv7.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.fusion_gate.bias", "write_shape": [2304], "chunk_shape": [2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.fusion_gate.kernel", "write_shape": [768, 2304], "chunk_shape": [768, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.local_cnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_0.rnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_1.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_10.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_11.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.input_proj.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.input_proj.kernel", "write_shape": [768, 384], "chunk_shape": [768, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.output_proj.bias", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.bidirectional_rnn.output_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.cnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.conv3.depthwise.kernel", "write_shape": [3, 1, 768], "chunk_shape": [3, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.conv3.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.conv5.depthwise.kernel", "write_shape": [5, 1, 768], "chunk_shape": [5, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.conv5.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.conv7.depthwise.kernel", "write_shape": [7, 1, 768], "chunk_shape": [7, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.conv7.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.fusion_gate.bias", "write_shape": [2304], "chunk_shape": [2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.fusion_gate.kernel", "write_shape": [768, 2304], "chunk_shape": [768, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.local_cnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_12.rnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_13.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_14.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.cnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.conv3.depthwise.kernel", "write_shape": [3, 1, 768], "chunk_shape": [3, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.conv3.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.conv5.depthwise.kernel", "write_shape": [5, 1, 768], "chunk_shape": [5, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.conv5.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.conv7.depthwise.kernel", "write_shape": [7, 1, 768], "chunk_shape": [7, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.conv7.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.fusion_gate.bias", "write_shape": [2304], "chunk_shape": [2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.fusion_gate.kernel", "write_shape": [768, 2304], "chunk_shape": [768, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_15.local_cnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.input_proj.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.input_proj.kernel", "write_shape": [768, 384], "chunk_shape": [768, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.output_proj.bias", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.bidirectional_rnn.output_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_16.rnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_17.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.cnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.conv3.depthwise.kernel", "write_shape": [3, 1, 768], "chunk_shape": [3, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.conv3.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.conv5.depthwise.kernel", "write_shape": [5, 1, 768], "chunk_shape": [5, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.conv5.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.conv7.depthwise.kernel", "write_shape": [7, 1, 768], "chunk_shape": [7, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.conv7.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.fusion_gate.bias", "write_shape": [2304], "chunk_shape": [2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.fusion_gate.kernel", "write_shape": [768, 2304], "chunk_shape": [768, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_18.local_cnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_19.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_2.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.input_proj.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.input_proj.kernel", "write_shape": [768, 384], "chunk_shape": [768, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.output_proj.bias", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.bidirectional_rnn.output_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_20.rnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.cnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.conv3.depthwise.kernel", "write_shape": [3, 1, 768], "chunk_shape": [3, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.conv3.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.conv5.depthwise.kernel", "write_shape": [5, 1, 768], "chunk_shape": [5, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.conv5.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.conv7.depthwise.kernel", "write_shape": [7, 1, 768], "chunk_shape": [7, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.conv7.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.fusion_gate.bias", "write_shape": [2304], "chunk_shape": [2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.fusion_gate.kernel", "write_shape": [768, 2304], "chunk_shape": [768, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_21.local_cnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_22.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_23.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.cnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.conv3.depthwise.kernel", "write_shape": [3, 1, 768], "chunk_shape": [3, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.conv3.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.conv5.depthwise.kernel", "write_shape": [5, 1, 768], "chunk_shape": [5, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.conv5.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.conv7.depthwise.kernel", "write_shape": [7, 1, 768], "chunk_shape": [7, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.conv7.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.fusion_gate.bias", "write_shape": [2304], "chunk_shape": [2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.fusion_gate.kernel", "write_shape": [768, 2304], "chunk_shape": [768, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_3.local_cnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.input_proj.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.input_proj.kernel", "write_shape": [768, 384], "chunk_shape": [768, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.output_proj.bias", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.bidirectional_rnn.output_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_4.rnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_5.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.cnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.conv3.depthwise.kernel", "write_shape": [3, 1, 768], "chunk_shape": [3, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.conv3.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.conv5.depthwise.kernel", "write_shape": [5, 1, 768], "chunk_shape": [5, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.conv5.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.conv7.depthwise.kernel", "write_shape": [7, 1, 768], "chunk_shape": [7, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.conv7.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.fusion_gate.bias", "write_shape": [2304], "chunk_shape": [2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.fusion_gate.kernel", "write_shape": [768, 2304], "chunk_shape": [768, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_6.local_cnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_7.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.backward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.backward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.forward_cell.MinGRUCell_0.candidate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.forward_cell.MinGRUCell_0.gate.kernel", "write_shape": [384, 384], "chunk_shape": [384, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.input_proj.bias", "write_shape": [384], "chunk_shape": [384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.input_proj.kernel", "write_shape": [768, 384], "chunk_shape": [768, 384], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.output_proj.bias", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.bidirectional_rnn.output_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_8.rnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.attn.k_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.attn.o_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.attn.q_proj.kernel", "write_shape": [768, 768], "chunk_shape": [768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.attn.v_proj.kernel", "write_shape": [768, 128], "chunk_shape": [768, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.attn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.cnn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.ffn.down_proj.kernel", "write_shape": [1920, 768], "chunk_shape": [1920, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.ffn.gate_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.ffn.up_proj.kernel", "write_shape": [768, 1920], "chunk_shape": [768, 1920], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.ffn_norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.conv3.depthwise.kernel", "write_shape": [3, 1, 768], "chunk_shape": [3, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.conv3.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.conv5.depthwise.kernel", "write_shape": [5, 1, 768], "chunk_shape": [5, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.conv5.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.conv7.depthwise.kernel", "write_shape": [7, 1, 768], "chunk_shape": [7, 1, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.conv7.pointwise.kernel", "write_shape": [1, 768, 768], "chunk_shape": [1, 768, 768], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.fusion_gate.bias", "write_shape": [2304], "chunk_shape": [2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.fusion_gate.kernel", "write_shape": [768, 2304], "chunk_shape": [768, 2304], "ext_metadata": null}}, {"array_metadata": {"param_name": "layers_9.local_cnn.layer_scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}, {"array_metadata": {"param_name": "lm_head.kernel", "write_shape": [768, 50264], "chunk_shape": [768, 50264], "ext_metadata": null}}, {"array_metadata": {"param_name": "norm.scale", "write_shape": [768], "chunk_shape": [768], "ext_metadata": null}}]}