From a8977699a3d0820e80129fb3c93c20fbd9972c41 Mon Sep 17 00:00:00 2001 From: Arthur Zucker Date: Fri, 10 May 2024 06:24:30 +0000 Subject: [PATCH] Update tokenizer_config.json (#60) - Update tokenizer_config.json (81e3437ab8e8e883c74b96df85196f3434c39d1c) Co-authored-by: NAVANIT DUBEY --- tokenizer_config.json | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tokenizer_config.json b/tokenizer_config.json index 870479e..1bfd114 100644 --- a/tokenizer_config.json +++ b/tokenizer_config.json @@ -2052,7 +2052,7 @@ "bos_token": "<|begin_of_text|>", "chat_template": "{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = bos_token + content %}{% endif %}{{ content }}{% endfor %}{% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}{% endif %}", "clean_up_tokenization_spaces": true, - "eos_token": "<|end_of_text|>", + "eos_token": "<|eot_id|>", "model_input_names": [ "input_ids", "attention_mask"