Update config.pbtxt

This commit is contained in:
cheetahadmin 2025-10-20 06:05:16 +00:00
parent 6c7148c0bf
commit 576866e68c

@@ -1,7 +1,7 @@
# Triton backend to use
name: "base-gemma-3-1b-it"
backend: "python"
max_batch_size: 150
max_batch_size: 200
# Triton should expect as input a single string
# input of variable length named 'text_input'
@@ -119,7 +119,7 @@ parameters: [
{
key: "quantization",
value: {string_value: "int4"}
value: {string_value: "int8"}
}
]