patrickvonplaten Xenova HF Staff committed on
Commit
4f81d78
·
verified ·
1 Parent(s): 4d14c1d

Do not add eos token by default (#8)

Browse files

- Do not add eos token by default (6d762032ac7adbc536dd25d458a13b59454b24cb)
- Update .gitattributes (1230593151b8a1e8f3de1f18958236404ed9b21c)
- Upload tokenizer.json (fdc0b188cb40e0a2e60574fce18079145c51e434)


Co-authored-by: Joshua <[email protected]>

Files changed (3) hide show
  1. .gitattributes +0 -1
  2. tokenizer.json +0 -0
  3. tokenizer_config.json +2 -0
.gitattributes CHANGED
@@ -34,4 +34,3 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  tekken.json filter=lfs diff=lfs merge=lfs -text
37
- tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  tekken.json filter=lfs diff=lfs merge=lfs -text
 
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -1,4 +1,6 @@
1
  {
 
 
2
  "add_prefix_space": false,
3
  "added_tokens_decoder": {
4
  "0": {
 
1
  {
2
+ "add_bos_token": true,
3
+ "add_eos_token": false,
4
  "add_prefix_space": false,
5
  "added_tokens_decoder": {
6
  "0": {