PocketDoc committed on
Commit
6e05cfc
·
verified ·
1 Parent(s): 1cb9777

Upload tokenizer_config.json

Browse files
Files changed (1) hide show
  1. tokenizer_config.json +2 -1
tokenizer_config.json CHANGED
@@ -8007,10 +8007,11 @@
8007
  "bos_token": "[gMASK]<sop>",
8008
  "clean_up_tokenization_spaces": false,
8009
  "eos_token": "<|endoftext|>",
 
8010
  "extra_special_tokens": {},
8011
  "model_max_length": 131072,
8012
  "pad_token": "<pad>",
8013
  "padding_side": "left",
8014
- "tokenizer_class": "PreTrainedTokenizer",
8015
  "unk_token": "<unk>"
8016
  }
 
8007
  "bos_token": "[gMASK]<sop>",
8008
  "clean_up_tokenization_spaces": false,
8009
  "eos_token": "<|endoftext|>",
8010
+ "chat_template": "{{ bos_token }}{%- set loop_messages = messages %}\n{%- for message in loop_messages %}\n {%- set content = '<|' + message['role'] + '|>'+ message['content'] | trim %}\n {%- if loop.index0 == 0 %}\n {%- set content = content %}\n {%- endif %}\n {%- if not (loop.last and message['role'] == 'assistant') %}\n {%- set content = content + '<|endoftext|>' %}\n {%- endif %}\n {{- content }}\n{%- endfor %}\n{%- if messages[-1]['role'] != 'assistant' %}\n {{- '<|assistant|>' }}\n{%- endif %}",
8011
  "extra_special_tokens": {},
8012
  "model_max_length": 131072,
8013
  "pad_token": "<pad>",
8014
  "padding_side": "left",
8015
+ "tokenizer_class": "PreTrainedTokenizerFast",
8016
  "unk_token": "<unk>"
8017
  }