From 7437bf7190063e007371ed31a42b687259d27d15 Mon Sep 17 00:00:00 2001 From: cheetahadmin Date: Thu, 13 Nov 2025 05:05:02 +0000 Subject: [PATCH] Update config.pbtxt --- config.pbtxt | 95 ++-------------------------------------------------- 1 file changed, 2 insertions(+), 93 deletions(-) diff --git a/config.pbtxt b/config.pbtxt index dd8edcc..69a0ad8 100644 --- a/config.pbtxt +++ b/config.pbtxt @@ -5,97 +5,20 @@ max_batch_size: 0 # Triton should expect as input a single string # input of variable length named 'text_input' input [ - { name: "text_input" data_type: TYPE_STRING dims: [ -1 ] - - - }, - { - name: "max_length" - data_type: TYPE_INT32 - dims: [ 1 ] - - optional: true - - - }, - { - name: "max_new_tokens" - data_type: TYPE_INT32 - dims: [ 1 ] - - optional: true - - - }, - { - name: "do_sample" - data_type: TYPE_BOOL - dims: [ 1 ] - - optional: true - - - }, - { - name: "top_k" - data_type: TYPE_INT32 - dims: [ 1 ] - - optional: true - - - }, - { - name: "top_p" - data_type: TYPE_FP32 - dims: [ 1 ] - - optional: true - - - }, - { - name: "temperature" - data_type: TYPE_FP32 - dims: [ 1 ] - - optional: true - - - }, - { - name: "repetition_penalty" - data_type: TYPE_FP32 - dims: [ 1 ] - - optional: true - - - }, - { - name: "stream" - data_type: TYPE_BOOL - dims: [ 1 ] - - optional: true - - } - ] -# Triton should expect to respond with a single string -# output of variable length named 'text_output' +# output of variable length named 'embedding_output' output [ { name: "embedding_output" data_type: TYPE_FP32 # 또는 TYPE_FP16 - dims: [ -1, -1 ] # [seq_len, hidden_size] + dims: [ -1, -1 ] # [seq_len, hidden_size] } ] @@ -103,19 +26,6 @@ parameters: [ { key: "base_model_path", value: {string_value: "/cheetah/input/model/groupuser/codesage-large-v2"} - }, - { - key: "is_adapter_model", - value: {string_value: "false"} - }, - { - key: "adapter_model_path", - value: {string_value: ""} - }, - - { - key: "quantization", - value: {string_value: "none"} } ] @@ -125,4 
+35,3 @@ instance_group [ count: 1 } ] -