{
"tokenizer_dir": "tokenizer",
"tokenizer_max_length": 77,
"vocab_size": 49408,
"preferred_token_dtype": "int32",
"fallback_token_dtype": "int64",
"dtype_attempt_order": [
"int32",
"int64"
],
"variants": {
"fp32": {
"requested_token_dtype": "int32",
"exported_input_name": "serving_default_args_0",
"exported_input_dtype": "INT32",
"exported_input_shape": [
1,
77
],
"token_range": [
267,
49407
],
"gpu_delegate_friendly": true
},
"int8": {
"requested_token_dtype": "int32",
"exported_input_name": "serving_default_args_0",
"exported_input_dtype": "INT32",
"exported_input_shape": [
1,
77
],
"token_range": [
267,
49407
],
"gpu_delegate_friendly": true
},
"android-qnn-npu": {
"requested_token_dtype": "int32",
"exported_input_name": "serving_default_args_0",
"exported_input_dtype": "INT32",
"exported_input_shape": [
1,
77
],
"token_range": [
267,
49407
],
"gpu_delegate_friendly": true,
"source_variant": "fp32",
"profile_name": "android-qnn-npu"
},
"android-cpu": {
"requested_token_dtype": "int32",
"exported_input_name": "serving_default_args_0",
"exported_input_dtype": "INT32",
"exported_input_shape": [
1,
77
],
"token_range": [
267,
49407
],
"gpu_delegate_friendly": true,
"source_variant": "fp32",
"profile_name": "android-cpu"
},
"android-gpu": {
"requested_token_dtype": "int32",
"exported_input_name": "serving_default_args_0",
"exported_input_dtype": "INT32",
"exported_input_shape": [
1,
77
],
"token_range": [
267,
49407
],
"gpu_delegate_friendly": true,
"source_variant": "fp32",
"profile_name": "android-gpu"
},
"ios-coreml": {
"requested_token_dtype": "int32",
"exported_input_name": "serving_default_args_0",
"exported_input_dtype": "INT32",
"exported_input_shape": [
1,
77
],
"token_range": [
267,
49407
],
"gpu_delegate_friendly": true,
"source_variant": "fp32",
"profile_name": "ios-coreml"
}
},
"notes": "Tokenizer output is external to the exported model. Token IDs are vocabulary indices and are not int8-quantized."
}