Update config.pbtxt

This commit is contained in:
cheetahadmin 2025-10-20 05:47:30 +00:00
parent a1841e0300
commit 6c7148c0bf

@ -1,7 +1,7 @@
# Triton backend to use # Triton backend to use
name: "base-gemma-3-1b-it" name: "base-gemma-3-1b-it"
backend: "python" backend: "python"
max_batch_size: 15 max_batch_size: 150
# Triton should expect as input a single string # Triton should expect as input a single string
# input of variable length named 'text_input' # input of variable length named 'text_input'
@ -119,7 +119,7 @@ parameters: [
{ {
key: "quantization", key: "quantization",
value: {string_value: "int8"} value: {string_value: "int4"}
} }
] ]