File size: 2,405 Bytes
8589396
 
 
 
 
 
 
 
 
 
 
 
 
 
6daac7d
 
bcc9199
6daac7d
 
 
 
 
c1350f8
 
 
 
6daac7d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
bcc9199
 
 
 
 
 
 
 
 
 
6daac7d
8589396
 
 
 
 
6daac7d
 
bcc9199
6daac7d
 
 
 
 
c1350f8
 
 
 
6daac7d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
bcc9199
 
 
 
 
 
 
 
 
 
6daac7d
8589396
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
{
  "$schema": "https://huggingface.co/software-mansion/react-native-executorch-spec/resolve/main/config.schema.json",
  "model": "phi_4_mini",
  "family": "phi",
  "capabilities": [
    "text-generation"
  ],
  "backend": "xnnpack",
  "license": "mit",
  "variants": [
    {
      "file": "phi_4_mini_xnnpack_bf16.pte",
      "precision": "bf16",
      "quantized": false,
      "default": true,
      "methods": {
        "enable_dynamic_shape": true,
        "forward": {
          "inputs": [
            {
              "shape": [
                1,
                {
                  "min": 1,
                  "max": 2048
                }
              ],
              "dtype": "int64"
            },
            {
              "shape": [
                1
              ],
              "dtype": "int64"
            }
          ],
          "outputs": [
            {
              "shape": [
                1,
                200064
              ],
              "dtype": "bfloat16"
            }
          ]
        },
        "get_bos_id": 151643,
        "get_eos_ids": [
          151643
        ],
        "get_max_context_len": 128,
        "get_max_seq_len": 128,
        "get_n_layers": null,
        "get_vocab_size": 200064,
        "use_kv_cache": true,
        "use_sdpa_with_kv_cache": true
      }
    },
    {
      "file": "phi_4_mini_xnnpack_8da4w.pte",
      "precision": "8da4w",
      "quantized": true,
      "default": false,
      "methods": {
        "enable_dynamic_shape": true,
        "forward": {
          "inputs": [
            {
              "shape": [
                1,
                {
                  "min": 1,
                  "max": 2048
                }
              ],
              "dtype": "int64"
            },
            {
              "shape": [
                1
              ],
              "dtype": "int64"
            }
          ],
          "outputs": [
            {
              "shape": [
                1,
                200064
              ],
              "dtype": "float32"
            }
          ]
        },
        "get_bos_id": 151643,
        "get_eos_ids": [
          151643
        ],
        "get_max_context_len": 128,
        "get_max_seq_len": 128,
        "get_n_layers": null,
        "get_vocab_size": 200064,
        "use_kv_cache": true,
        "use_sdpa_with_kv_cache": true
      }
    }
  ]
}