Update config.pbtxt
This commit is contained in:
parent
f354f143a2
commit
5d5173ea23
@ -1,7 +1,7 @@
|
|||||||
# Triton backend to use
|
# Triton backend to use
|
||||||
name: "base-gemma-3-1b-it"
|
name: "base-gemma-3-1b-it"
|
||||||
backend: "python"
|
backend: "python"
|
||||||
max_batch_size: 4
|
max_batch_size: 5
|
||||||
|
|
||||||
# Triton should expect as input a single string
|
# Triton should expect as input a single string
|
||||||
# input of variable length named 'text_input'
|
# input of variable length named 'text_input'
|
||||||
@ -125,8 +125,8 @@ parameters: [
|
|||||||
|
|
||||||
instance_group [
|
instance_group [
|
||||||
{
|
{
|
||||||
kind: KIND_CPU
|
kind: KIND_GPU
|
||||||
count: 8
|
count: 7
|
||||||
}
|
}
|
||||||
]
|
]
|
||||||
|
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user