Upload tokenizer_config.json
Browse files
- tokenizer_config.json +2 -1
tokenizer_config.json
CHANGED
@@ -8007,10 +8007,11 @@
|
|
8007 |
"bos_token": "[gMASK]<sop>",
|
8008 |
"clean_up_tokenization_spaces": false,
|
8009 |
"eos_token": "<|endoftext|>",
|
|
|
8010 |
"extra_special_tokens": {},
|
8011 |
"model_max_length": 131072,
|
8012 |
"pad_token": "<pad>",
|
8013 |
"padding_side": "left",
|
8014 |
-
"tokenizer_class": "
|
8015 |
"unk_token": "<unk>"
|
8016 |
}
|
|
|
8007 |
"bos_token": "[gMASK]<sop>",
|
8008 |
"clean_up_tokenization_spaces": false,
|
8009 |
"eos_token": "<|endoftext|>",
|
8010 |
+
"chat_template": "{{ bos_token }}{%- set loop_messages = messages %}\n{%- for message in loop_messages %}\n {%- set content = '<|' + message['role'] + '|>'+ message['content'] | trim %}\n {%- if loop.index0 == 0 %}\n {%- set content = content %}\n {%- endif %}\n {%- if not (loop.last and message['role'] == 'assistant') %}\n {%- set content = content + '<|endoftext|>' %}\n {%- endif %}\n {{- content }}\n{%- endfor %}\n{%- if messages[-1]['role'] != 'assistant' %}\n {{- '<|assistant|>' }}\n{%- endif %}",
|
8011 |
"extra_special_tokens": {},
|
8012 |
"model_max_length": 131072,
|
8013 |
"pad_token": "<pad>",
|
8014 |
"padding_side": "left",
|
8015 |
+
"tokenizer_class": "PreTrainedTokenizerFast",
|
8016 |
"unk_token": "<unk>"
|
8017 |
}
|