playwebit / tokenizer.json
mike23415's picture
Create tokenizer.json
2a59d94 verified
raw
history blame
465 Bytes
{
"version": "1.0",
"truncation": null,
"padding": null,
"added_tokens": [],
"normalizer": null,
"pre_tokenizer": null,
"post_processor": null,
"decoder": null,
"model": {
"type": "BPE",
"dropout": null,
"unk_token": "<UNK>",
"continuing_subword_prefix": null,
"end_of_word_suffix": null,
"fuse_unk": false,
"vocab": {
"<PAD>": 0,
"<BOS>": 1,
"<EOS>": 2,
"<UNK>": 3
},
"merges": []
}
}