# Model configuration (protobuf text format) for "tinybert-familyhistory-de".
#
# Layout note: in protobuf text format a '#' starts a comment that runs to
# the end of the line. Every field therefore lives on its own line so that
# a comment can never swallow the settings that follow it.

name: "tinybert-familyhistory-de"
backend: "python"

# 0 = no server-managed batch dimension; the dims below describe the full
# tensor shape as-is.
max_batch_size: 0

# Single variable-length string tensor in.
input [
  {
    name: "text"
    data_type: TYPE_STRING
    dims: [ -1 ]
  }
]

# Single variable-length string tensor out.
output [
  {
    name: "output"
    data_type: TYPE_STRING
    dims: [ -1 ]
  }
]

# One model instance, executed on CPU.
instance_group [
  {
    count: 1
    kind: KIND_CPU
  }
]

# CPU-specific optimizations.
# NOTE(review): execution accelerators are normally honored by framework
# backends (e.g. ONNX Runtime); confirm that this block has any effect with
# backend "python", or that the model code inspects it itself.
optimization {
  execution_accelerators {
    cpu_execution_accelerator: [
      { name: "openvino" }
    ]
  }
}

# Performance tuning parameters.
# Values are passed as strings. Presumably they are read by the model's own
# Python code (not visible here) -- verify the key names against that code.
parameters: {
  key: "INFERENCE_BATCH_SIZE"
  value: { string_value: "96" }
}
parameters: {
  key: "MAX_SEQUENCE_LENGTH"
  value: { string_value: "512" }
}