{
  "added_tokens_decoder": {
    "0": {
      "content": "<|endoftext|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "1": {
      "content": "<|padding|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "2": {
      "content": "<|mask|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "3": {
      "content": "<|user|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "4": {
      "content": "<|assistant|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "5": {
      "content": "<|system|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "6": {
      "content": "<|end|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "7": {
      "content": "<|en|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "8": {
      "content": "<|ru|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "9": {
      "content": "<|tok|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "10": {
      "content": "<|",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "11": {
      "content": "|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    }
  },
  "additional_special_tokens": [
    "<|endoftext|>",
    "<|padding|>",
    "<|mask|>",
    "<|user|>",
    "<|assistant|>",
    "<|system|>",
    "<|end|>",
    "<|en|>",
    "<|ru|>",
    "<|tok|>",
    "<|",
    "|>"
  ],
  "bos_token": "<|endoftext|>",
  "chat_template": "{% for message in messages %}{% if message['lang'] %}{{ \"<|\" + message['lang'] + \"|>\" }}{% endif %}{{ \"<|\" + message['role'] + \"|>\" }}{{ message['content'] }}<|end|>{% endfor %}",
  "clean_up_tokenization_spaces": false,
  "eos_token": "<|end|>",
  "extra_special_tokens": {},
  "mask_token": "<|mask|>",
  "max_length": 65536,
  "model_max_length": 65536,
  "pad_to_multiple_of": 8,
  "pad_token": "<|padding|>",
  "pad_token_type_id": 0,
  "padding_side": "left",
  "stride": 0,
  "tokenizer_class": "PreTrainedTokenizer",
  "truncation_side": "left",
  "truncation_strategy": "longest_first",
  "unk_token": "<|endoftext|>"
}