Compare commits

..

3 Commits

Author SHA1 Message Date
766fca2517 Create New File 2025-04-30 07:32:46 +00:00
5b9d078db3 Automatically created by CHEETAH 2025-04-23 12:51:13 +00:00
98684d5814 Automatically created by CHEETAH 2025-04-23 12:51:12 +00:00
12 changed files with 13 additions and 38 deletions

@ -2,7 +2,6 @@ import triton_python_backend_utils as pb_utils
from transformers import AutoModelForCausalLM, AutoTokenizer, GenerationConfig from transformers import AutoModelForCausalLM, AutoTokenizer, GenerationConfig
import numpy as np import numpy as np
import json import json
import os
class TritonPythonModel: class TritonPythonModel:
def initialize(self, args): def initialize(self, args):
@ -13,27 +12,9 @@ class TritonPythonModel:
""" """
self.logger = pb_utils.Logger self.logger = pb_utils.Logger
current_file_path = os.path.abspath(__file__)
self.logger.log_info(f"current_file_path: {current_file_path}")
self.model_name = args["model_name"] self.model_name = args["model_name"]
model_repository = args["model_repository"] model_repository = args["model_repository"]
model_path = f"{model_repository}/{self.model_name}" model_path = f"{model_repository}/{self.model_name}"
#model_path = "/cheetah/input/model/gemma-3-1b-it/gemma-3-1b-it"
input_model_path = model_path
if os.path.exists(input_model_path):
file_list = os.listdir(input_model_path)
self.logger.log_info(f"'{input_model_path}' 디렉토리의 파일 목록:")
for file_name in file_list:
self.logger.log_info(file_name)
else:
self.logger.log_info(f"'{input_model_path}' 디렉토리가 존재하지 않습니다.")
self.logger.log_info(f"model_repository: {model_repository}")
self.logger.log_info(f"model_path: {model_path}")
self.model_config = json.loads(args["model_config"]) self.model_config = json.loads(args["model_config"])

@ -1,6 +1,3 @@
test.txt test.txt
test.txt test.txt
test.txt test.txt
test.txt
test.txt

@ -1,7 +1,6 @@
# Triton backend to use
name: "gemma-3-1b-it" name: "gemma-3-1b-it"
backend: "python"
max_batch_size: 0 max_batch_size: 0
backend: "python"
# Triton should expect as input a single string # Triton should expect as input a single string
# input of variable length named 'text_input' # input of variable length named 'text_input'
@ -72,7 +71,6 @@ output [
} }
] ]
parameters: [ parameters: [
{ {
key: "enable_inference_trace", key: "enable_inference_trace",
@ -86,4 +84,3 @@ instance_group [
count: 1 count: 1
} }
] ]