thisisHJLee committed on
Commit
5726c4f
·
1 Parent(s): 54f5d84

add tokenizer

Browse files
runs/Oct19_06-28-56_0e4cdf942af6/events.out.tfevents.1666161780.0e4cdf942af6.9735.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:99255eb4180c03e175a45086d34bc34860285e10b92d04b1038811f9b28fa306
3
- size 5217
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53abfe94201314a371ce848b8d9f8493e11f6cb9d7e92d44a150b99824ba2979
3
+ size 9206
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]"}
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"unk_token": "[UNK]", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "[PAD]", "do_lower_case": false, "word_delimiter_token": "|", "replace_word_delimiter_char": " ", "tokenizer_class": "Wav2Vec2CTCTokenizer"}
vocab.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"\n": 0, "0": 2, "1": 3, "2": 4, "3": 5, "4": 6, "5": 7, "6": 8, "7": 9, "8": 10, "9": 11, "a": 12, "b": 13, "c": 14, "h": 15, "l": 16, "m": 17, "n": 18, "o": 19, "p": 20, "s": 21, "t": 22, "z": 23, "ㄱ": 24, "ㄲ": 25, "ㄴ": 26, "ㄵ": 27, "ㄶ": 28, "ㄷ": 29, "ㄸ": 30, "ㄹ": 31, "ㄺ": 32, "ㄻ": 33, "ㄼ": 34, "ㄾ": 35, "ㅀ": 36, "ㅁ": 37, "ㅂ": 38, "ㅃ": 39, "ㅄ": 40, "ㅅ": 41, "ㅆ": 42, "ㅇ": 43, "ㅈ": 44, "ㅉ": 45, "ㅊ": 46, "ㅋ": 47, "ㅌ": 48, "ㅍ": 49, "ㅎ": 50, "ㅏ": 51, "ㅐ": 52, "ㅑ": 53, "ㅒ": 54, "ㅓ": 55, "ㅔ": 56, "ㅕ": 57, "ㅖ": 58, "ㅗ": 59, "ㅘ": 60, "ㅙ": 61, "ㅚ": 62, "ㅛ": 63, "ㅜ": 64, "ㅝ": 65, "ㅞ": 66, "ㅟ": 67, "ㅠ": 68, "ㅡ": 69, "ㅢ": 70, "ㅣ": 71, ",": 72, "|": 1, "[UNK]": 73, "[PAD]": 74}