# Triton Inference Server model configuration for the "yolo11-tensorrt" model.

# Model name and the Triton backend/platform used to execute it.
name: "yolo11-tensorrt"
backend: "tensorrt"
platform: "tensorrt_plan"

# 0 means Triton does not add an implicit batch dimension, so the dims
# declared below are the complete tensor shapes (leading 1 included).
max_batch_size: 0

# Model file to load when no platform-specific default name applies.
default_model_filename: "yolo11n.engine"

# Single FP32 input tensor named "images" with a fixed shape.
input [
  {
    name: "images"
    data_type: TYPE_FP32
    dims: [1, 3, 640, 640]
  }
]

# Triton responds with a single FP32 tensor of fixed shape named "output0".
output [
  {
    name: "output0"
    data_type: TYPE_FP32
    dims: [1, 84, 8400]
  }
]

# One execution instance; KIND_AUTO lets Triton choose the device kind.
instance_group [
  {
    kind: KIND_AUTO
    count: 1
  }
]