NorbertKlockiewicz's picture
Use min/max dynamic shape bounds for forward inputs/outputs
c1350f8
Raw
History Blame Contribute Delete
2.41 kB
{
"$schema": "https://huggingface.co/software-mansion/react-native-executorch-spec/resolve/main/config.schema.json",
"model": "phi_4_mini",
"family": "phi",
"capabilities": [
"text-generation"
],
"backend": "xnnpack",
"license": "mit",
"variants": [
{
"file": "phi_4_mini_xnnpack_bf16.pte",
"precision": "bf16",
"quantized": false,
"default": true,
"methods": {
"enable_dynamic_shape": true,
"forward": {
"inputs": [
{
"shape": [
1,
{
"min": 1,
"max": 2048
}
],
"dtype": "int64"
},
{
"shape": [
1
],
"dtype": "int64"
}
],
"outputs": [
{
"shape": [
1,
200064
],
"dtype": "bfloat16"
}
]
},
"get_bos_id": 151643,
"get_eos_ids": [
151643
],
"get_max_context_len": 128,
"get_max_seq_len": 128,
"get_n_layers": null,
"get_vocab_size": 200064,
"use_kv_cache": true,
"use_sdpa_with_kv_cache": true
}
},
{
"file": "phi_4_mini_xnnpack_8da4w.pte",
"precision": "8da4w",
"quantized": true,
"default": false,
"methods": {
"enable_dynamic_shape": true,
"forward": {
"inputs": [
{
"shape": [
1,
{
"min": 1,
"max": 2048
}
],
"dtype": "int64"
},
{
"shape": [
1
],
"dtype": "int64"
}
],
"outputs": [
{
"shape": [
1,
200064
],
"dtype": "float32"
}
]
},
"get_bos_id": 151643,
"get_eos_ids": [
151643
],
"get_max_context_len": 128,
"get_max_seq_len": 128,
"get_n_layers": null,
"get_vocab_size": 200064,
"use_kv_cache": true,
"use_sdpa_with_kv_cache": true
}
}
]
}