moyixiao's picture
Upload folder using huggingface_hub
1773fbd verified
{"array_metadatas": [{"array_metadata": {"param_name": "embedding_layer.pos_emb.embedding.value", "write_shape": [64, 128], "chunk_shape": [64, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "embedding_layer.token_emb.embedding.value", "write_shape": [50258, 32], "chunk_shape": [50258, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "output_layer.bias.value", "write_shape": [25129], "chunk_shape": [25129], "ext_metadata": null}}, {"array_metadata": {"param_name": "output_layer.kernel.value", "write_shape": [64, 25129], "chunk_shape": [64, 25129], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.0.layer_norm1.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.0.layer_norm1.scale.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.0.layer_norm2.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.0.layer_norm2.scale.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.0.linear1.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.0.linear1.kernel.value", "write_shape": [64, 128], "chunk_shape": [64, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.0.linear2.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.0.linear2.kernel.value", "write_shape": [64, 128], "chunk_shape": [64, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.0.mha.key.bias.value", "write_shape": [1, 32], "chunk_shape": [1, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.0.mha.key.kernel.value", "write_shape": [64, 4, 32], "chunk_shape": [64, 4, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.0.mha.out.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.0.mha.out.kernel.value", "write_shape": [2, 16, 256], "chunk_shape": [2, 16, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.0.mha.query.bias.value", "write_shape": [1, 32], "chunk_shape": [1, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.0.mha.query.kernel.value", "write_shape": [64, 4, 32], "chunk_shape": [64, 4, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.0.mha.value.bias.value", "write_shape": [1, 32], "chunk_shape": [1, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.0.mha.value.kernel.value", "write_shape": [64, 4, 32], "chunk_shape": [64, 4, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.1.layer_norm1.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.1.layer_norm1.scale.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.1.layer_norm2.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.1.layer_norm2.scale.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.1.linear1.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.1.linear1.kernel.value", "write_shape": [64, 128], "chunk_shape": [64, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.1.linear2.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.1.linear2.kernel.value", "write_shape": [64, 128], "chunk_shape": [64, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.1.mha.key.bias.value", "write_shape": [1, 32], "chunk_shape": [1, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.1.mha.key.kernel.value", "write_shape": [64, 4, 32], "chunk_shape": [64, 4, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.1.mha.out.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.1.mha.out.kernel.value", "write_shape": [2, 16, 256], "chunk_shape": [2, 16, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.1.mha.query.bias.value", "write_shape": [1, 32], "chunk_shape": [1, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.1.mha.query.kernel.value", "write_shape": [64, 4, 32], "chunk_shape": [64, 4, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.1.mha.value.bias.value", "write_shape": [1, 32], "chunk_shape": [1, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.1.mha.value.kernel.value", "write_shape": [64, 4, 32], "chunk_shape": [64, 4, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.2.layer_norm1.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.2.layer_norm1.scale.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.2.layer_norm2.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.2.layer_norm2.scale.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.2.linear1.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.2.linear1.kernel.value", "write_shape": [64, 128], "chunk_shape": [64, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.2.linear2.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.2.linear2.kernel.value", "write_shape": [64, 128], "chunk_shape": [64, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.2.mha.key.bias.value", "write_shape": [1, 32], "chunk_shape": [1, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.2.mha.key.kernel.value", "write_shape": [64, 4, 32], "chunk_shape": [64, 4, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.2.mha.out.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.2.mha.out.kernel.value", "write_shape": [2, 16, 256], "chunk_shape": [2, 16, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.2.mha.query.bias.value", "write_shape": [1, 32], "chunk_shape": [1, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.2.mha.query.kernel.value", "write_shape": [64, 4, 32], "chunk_shape": [64, 4, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.2.mha.value.bias.value", "write_shape": [1, 32], "chunk_shape": [1, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.2.mha.value.kernel.value", "write_shape": [64, 4, 32], "chunk_shape": [64, 4, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.3.layer_norm1.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.3.layer_norm1.scale.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.3.layer_norm2.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.3.layer_norm2.scale.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.3.linear1.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.3.linear1.kernel.value", "write_shape": [64, 128], "chunk_shape": [64, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.3.linear2.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.3.linear2.kernel.value", "write_shape": [64, 128], "chunk_shape": [64, 128], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.3.mha.key.bias.value", "write_shape": [1, 32], "chunk_shape": [1, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.3.mha.key.kernel.value", "write_shape": [64, 4, 32], "chunk_shape": [64, 4, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.3.mha.out.bias.value", "write_shape": [32], "chunk_shape": [32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.3.mha.out.kernel.value", "write_shape": [2, 16, 256], "chunk_shape": [2, 16, 256], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.3.mha.query.bias.value", "write_shape": [1, 32], "chunk_shape": [1, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.3.mha.query.kernel.value", "write_shape": [64, 4, 32], "chunk_shape": [64, 4, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.3.mha.value.bias.value", "write_shape": [1, 32], "chunk_shape": [1, 32], "ext_metadata": null}}, {"array_metadata": {"param_name": "transformer_blocks.3.mha.value.kernel.value", "write_shape": [64, 4, 32], "chunk_shape": [64, 4, 32], "ext_metadata": null}}]}