Closed
Description
# Ensemble model configuration that chains three steps in order:
# "preprocessing" -> "tensorrt_llm" -> "postprocessing".
name: "ensemble"
platform: "ensemble"
max_batch_size: 128
# Tensors accepted by the ensemble as a whole.
input [
{
name: "text_input"
data_type: TYPE_STRING
dims: [ -1 ]
}
]
# Tensors produced by the ensemble as a whole. Only the names declared here
# ("text_output", "output_token_lengths") appear in this output list.
output [
{
name: "text_output"
data_type: TYPE_STRING
dims: [ -1, -1 ]
},
{
name: "output_token_lengths"
data_type: TYPE_INT32
dims: [ -1, -1 ]
}
]
# Step wiring. In each input_map/output_map, "key" is the tensor name on the
# step's model and "value" is the tensor name used inside this ensemble.
ensemble_scheduling {
step [
{
# Step 1: feeds the ensemble input "text_input" to the model's "QUERY" input.
model_name: "preprocessing"
# NOTE(review): -1 presumably selects the latest available version — confirm
# against the Triton model configuration documentation.
model_version: -1
input_map {
key: "QUERY"
value: "text_input"
}
# "_REQUEST_INPUT_LEN" is consumed by the "tensorrt_llm" step below and is
# not declared in the ensemble's output [] list above.
# NOTE(review): to return this value to the caller it would presumably have
# to be declared in output [] and mapped under that declared name — confirm
# against the Triton ensemble documentation.
output_map {
key: "REQUEST_INPUT_LEN"
value: "_REQUEST_INPUT_LEN"
}
},
{
# Step 2: receives "_REQUEST_INPUT_LEN" as "input_lengths" and publishes
# its "output_ids" as "_TOKENS_BATCH".
model_name: "tensorrt_llm"
model_version: -1
input_map {
key: "input_lengths"
value: "_REQUEST_INPUT_LEN"
}
output_map {
key: "output_ids"
value: "_TOKENS_BATCH"
}
},
{
# Step 3: receives "_TOKENS_BATCH" as "TOKENS_BATCH" and maps its two
# outputs onto the ensemble outputs declared in output [] above.
model_name: "postprocessing"
model_version: -1
input_map {
key: "TOKENS_BATCH"
value: "_TOKENS_BATCH"
}
output_map {
key: "OUTPUT"
value: "text_output"
}
output_map {
key: "OUTPUT1"
value: "output_token_lengths"
}
}
]
}
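This is a simplified version of my ensemble configuration.
I would like to know how to retrieve the value of the following tensor from the ensemble:
ensemble_scheduling --> model_name "preprocessing" --> output_map --> value: "_REQUEST_INPUT_LEN"
That is, how can I have the ensemble return this value to the caller?
Are there any examples of this?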
Metadata
Metadata
Assignees
Labels
No labels