hieupth
chore: add onnx model
fcba339 unverified
name: "viencoder"
# maximum batch size
max_batch_size: 0
platform: "ensemble"
#input to the model
input [
{
name: "TEXT"
data_type: TYPE_STRING
dims: [ -1 ]
# -1 means dynamic axis, aka this dimension may change
}
]
#output of the model
output {
name: "output_0"
data_type: TYPE_FP32
dims: [-1, -1]
# two dimensional tensor, where 1st dimension: batch-size, 2nd dimension: #classes
}
#Type of scheduler to be used
ensemble_scheduling {
step [
{
model_name: "viencoder.tokenizer"
model_version: -1
input_map {
key: "TEXT"
value: "TEXT"
}
output_map [
{
key: "input_ids"
value: "input_ids"
},
{
key: "attention_mask"
value: "attention_mask"
}
]
},
{
model_name: "viencoder.model"
model_version: -1
input_map [
{
key: "input_ids"
value: "input_ids"
},
{
key: "attention_mask"
value: "attention_mask"
}
]
output_map {
key: "sentence_embedding"
value: "output_0"
}
}
]
}