File size: 2,550 Bytes
2bcc764
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7b0cd98
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2bcc764
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
{
  "tokenizer_dir": "tokenizer",
  "tokenizer_max_length": 77,
  "vocab_size": 49408,
  "preferred_token_dtype": "int32",
  "fallback_token_dtype": "int64",
  "dtype_attempt_order": [
    "int32",
    "int64"
  ],
  "variants": {
    "fp32": {
      "requested_token_dtype": "int32",
      "exported_input_name": "serving_default_args_0",
      "exported_input_dtype": "INT32",
      "exported_input_shape": [
        1,
        77
      ],
      "token_range": [
        267,
        49407
      ],
      "gpu_delegate_friendly": true
    },
    "int8": {
      "requested_token_dtype": "int32",
      "exported_input_name": "serving_default_args_0",
      "exported_input_dtype": "INT32",
      "exported_input_shape": [
        1,
        77
      ],
      "token_range": [
        267,
        49407
      ],
      "gpu_delegate_friendly": true
    },
    "android-qnn-npu": {
      "requested_token_dtype": "int32",
      "exported_input_name": "serving_default_args_0",
      "exported_input_dtype": "INT32",
      "exported_input_shape": [
        1,
        77
      ],
      "token_range": [
        267,
        49407
      ],
      "gpu_delegate_friendly": true,
      "source_variant": "fp32",
      "profile_name": "android-qnn-npu"
    },
    "android-cpu": {
      "requested_token_dtype": "int32",
      "exported_input_name": "serving_default_args_0",
      "exported_input_dtype": "INT32",
      "exported_input_shape": [
        1,
        77
      ],
      "token_range": [
        267,
        49407
      ],
      "gpu_delegate_friendly": true,
      "source_variant": "fp32",
      "profile_name": "android-cpu"
    },
    "android-gpu": {
      "requested_token_dtype": "int32",
      "exported_input_name": "serving_default_args_0",
      "exported_input_dtype": "INT32",
      "exported_input_shape": [
        1,
        77
      ],
      "token_range": [
        267,
        49407
      ],
      "gpu_delegate_friendly": true,
      "source_variant": "fp32",
      "profile_name": "android-gpu"
    },
    "ios-coreml": {
      "requested_token_dtype": "int32",
      "exported_input_name": "serving_default_args_0",
      "exported_input_dtype": "INT32",
      "exported_input_shape": [
        1,
        77
      ],
      "token_range": [
        267,
        49407
      ],
      "gpu_delegate_friendly": true,
      "source_variant": "fp32",
      "profile_name": "ios-coreml"
    }
  },
  "notes": "Tokenizer output is external to the exported model. Token IDs are vocabulary indices and are not int8-quantized."
}