Update config.pbtxt

This commit is contained in:
cheetahadmin 2025-10-20 04:41:24 +00:00
parent ccd9eb0e80
commit 4bb6be215e

@@ -1,7 +1,7 @@
# Triton backend to use
name: "base-gemma-3-1b-it"
backend: "python"
-max_batch_size: 4
+max_batch_size: 8
# Triton should expect as input a single string
# input of variable length named 'text_input'
@@ -119,7 +119,7 @@ parameters: [
{
key: "quantization",
-value: {string_value: "int4"}
+value: {string_value: "int8"}
}
]