thisisHJLee committed on
Commit
3af1aba
·
1 Parent(s): 9d0436d

add tokenizer

Browse files
runs/Oct17_05-43-15_e6cad45de4b8/events.out.tfevents.1665985956.e6cad45de4b8.95.2 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7ab68a8b120c47e3dbf30afaa0db08135822158803a3e571052055bc4e0cf733
3
- size 5060
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee97845805357d852644966fa9393c3c3e71b1fbab78c412f3c117924b9320bd
3
+ size 8268
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]"}
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"unk_token": "[UNK]", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "[PAD]", "do_lower_case": false, "word_delimiter_token": "|", "replace_word_delimiter_char": " ", "tokenizer_class": "Wav2Vec2CTCTokenizer"}
vocab.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"\n": 0, "0": 2, "1": 3, "2": 4, "3": 5, "4": 6, "5": 7, "6": 8, "7": 9, "8": 10, "9": 11, "a": 12, "b": 13, "c": 14, "h": 15, "l": 16, "m": 17, "n": 18, "p": 19, "s": 20, "t": 21, "z": 22, "ㄱ": 23, "ㄲ": 24, "ㄴ": 25, "ㄵ": 26, "ㄶ": 27, "ㄷ": 28, "ㄸ": 29, "ㄹ": 30, "ㄺ": 31, "ㄻ": 32, "ㄼ": 33, "ㅀ": 34, "ㅁ": 35, "ㅂ": 36, "ㅃ": 37, "ㅄ": 38, "ㅅ": 39, "ㅆ": 40, "ㅇ": 41, "ㅈ": 42, "ㅉ": 43, "ㅊ": 44, "ㅋ": 45, "ㅌ": 46, "ㅍ": 47, "ㅎ": 48, "ㅏ": 49, "ㅐ": 50, "ㅑ": 51, "ㅒ": 52, "ㅓ": 53, "ㅔ": 54, "ㅕ": 55, "ㅖ": 56, "ㅗ": 57, "ㅘ": 58, "ㅙ": 59, "ㅚ": 60, "ㅛ": 61, "ㅜ": 62, "ㅝ": 63, "ㅞ": 64, "ㅟ": 65, "ㅠ": 66, "ㅡ": 67, "ㅢ": 68, "ㅣ": 69, ",": 70, "|": 1, "[UNK]": 71, "[PAD]": 72}