Update config.pbtxt

This commit is contained in:
groupuser 2025-10-20 04:43:53 +00:00
parent 4bb6be215e
commit 38602559b5

@@ -1,7 +1,7 @@
# Triton backend to use
name: "base-gemma-3-1b-it"
backend: "python"
-max_batch_size: 8
+max_batch_size: 5
# Triton should expect as input a single string
# input of variable length named 'text_input'
@@ -119,7 +119,7 @@ parameters: [
{
key: "quantization",
-value: {string_value: "int8"}
+value: {string_value: "int4"}
}
]