Update config.pbtxt

This commit is contained in:
cheetahadmin 2025-10-20 05:20:39 +00:00
parent dd8eb6c342
commit a1841e0300

@@ -130,3 +130,20 @@ instance_group [
}
]
# "model": {
# "name": "Llama-3.2-1B-Instruct",
# "backend": "TransformerLLM",
# "tensorrtllm": {
# "workers": 1,
# "maxSeqLen": 1,
# "kvCacheType": "paged",
# "maxInputLen": 1024,
# "maxNumTokens": 0
# },
# "maxBatchSize": 4,
# "quantization": "int4",
# "modelInstanceGroupKind": "KIND_GPU",
# "modelInstanceGroupCount": 1
# }