Update config.pbtxt
This commit is contained in:
parent
a1841e0300
commit
6c7148c0bf
@ -1,7 +1,7 @@
|
|||||||
# Triton backend to use
|
# Triton backend to use
|
||||||
name: "base-gemma-3-1b-it"
|
name: "base-gemma-3-1b-it"
|
||||||
backend: "python"
|
backend: "python"
|
||||||
max_batch_size: 15
|
max_batch_size: 150
|
||||||
|
|
||||||
# Triton should expect as input a single string
|
# Triton should expect as input a single string
|
||||||
# input of variable length named 'text_input'
|
# input of variable length named 'text_input'
|
||||||
@ -119,7 +119,7 @@ parameters: [
|
|||||||
|
|
||||||
{
|
{
|
||||||
key: "quantization",
|
key: "quantization",
|
||||||
value: {string_value: "int8"}
|
value: {string_value: "int4"}
|
||||||
}
|
}
|
||||||
]
|
]
|
||||||
|
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user