Bertug1911 committed on
Commit
f21ce1c
·
verified ·
1 Parent(s): 8928057

Update tokenizer_config.json

Browse files
Files changed (1) hide show
  1. tokenizer_config.json +16 -3
tokenizer_config.json CHANGED
@@ -1,5 +1,6 @@
1
  {
2
- "max_lenght": 1024,
 
3
  "added_tokens_decoder": {
4
  "0": {
5
  "content": "<|BOS|>",
@@ -40,6 +41,18 @@
40
  "rstrip": false,
41
  "single_word": false,
42
  "special": true
43
- },
44
- }
 
 
 
 
 
 
 
 
 
 
 
 
45
  }
 
1
  {
2
+ "add_bos_token": false,
3
+ "add_eos_token": false,
4
  "added_tokens_decoder": {
5
  "0": {
6
  "content": "<|BOS|>",
 
41
  "rstrip": false,
42
  "single_word": false,
43
  "special": true
44
+ }
45
+ },
46
+ "bos_token": "<|BOS|>",
47
+ "clean_up_tokenization_spaces": true,
48
+ "eos_token": "<|im_end|>",
49
+ "extra_special_tokens": {},
50
+ "legacy": false,
51
+ "max_length": 1024,
52
+ "pad_token": "<|pad|>",
53
+ "sp_model_kwargs": {},
54
+ "spaces_between_special_tokens": false,
55
+ "tokenizer_class": "PreTrainedTokenizerFast",
56
+ "use_default_system_prompt": false,
57
+ "use_fast": true
58
  }