From 5d5173ea23f597cf8fdb69fb89b5246ddd2e8acb Mon Sep 17 00:00:00 2001 From: cheetahadmin Date: Fri, 17 Oct 2025 09:54:47 +0000 Subject: [PATCH] Update config.pbtxt --- config.pbtxt | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/config.pbtxt b/config.pbtxt index 5d90dc8..185add8 100644 --- a/config.pbtxt +++ b/config.pbtxt @@ -1,7 +1,7 @@ # Triton backend to use name: "base-gemma-3-1b-it" backend: "python" -max_batch_size: 4 +max_batch_size: 5 # Triton should expect as input a single string # input of variable length named 'text_input' @@ -125,8 +125,8 @@ parameters: [ instance_group [ { - kind: KIND_CPU - count: 8 + kind: KIND_GPU + count: 7 } ]