Commit
·
3af1aba
1
Parent(s):
9d0436d
add tokenizer
Browse files
runs/Oct17_05-43-15_e6cad45de4b8/events.out.tfevents.1665985956.e6cad45de4b8.95.2
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee97845805357d852644966fa9393c3c3e71b1fbab78c412f3c117924b9320bd
|
3 |
+
size 8268
|
special_tokens_map.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]"}
|
tokenizer_config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"unk_token": "[UNK]", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "[PAD]", "do_lower_case": false, "word_delimiter_token": "|", "replace_word_delimiter_char": " ", "tokenizer_class": "Wav2Vec2CTCTokenizer"}
|
vocab.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"\n": 0, "0": 2, "1": 3, "2": 4, "3": 5, "4": 6, "5": 7, "6": 8, "7": 9, "8": 10, "9": 11, "a": 12, "b": 13, "c": 14, "h": 15, "l": 16, "m": 17, "n": 18, "p": 19, "s": 20, "t": 21, "z": 22, "ㄱ": 23, "ㄲ": 24, "ㄴ": 25, "ㄵ": 26, "ㄶ": 27, "ㄷ": 28, "ㄸ": 29, "ㄹ": 30, "ㄺ": 31, "ㄻ": 32, "ㄼ": 33, "ㅀ": 34, "ㅁ": 35, "ㅂ": 36, "ㅃ": 37, "ㅄ": 38, "ㅅ": 39, "ㅆ": 40, "ㅇ": 41, "ㅈ": 42, "ㅉ": 43, "ㅊ": 44, "ㅋ": 45, "ㅌ": 46, "ㅍ": 47, "ㅎ": 48, "ㅏ": 49, "ㅐ": 50, "ㅑ": 51, "ㅒ": 52, "ㅓ": 53, "ㅔ": 54, "ㅕ": 55, "ㅖ": 56, "ㅗ": 57, "ㅘ": 58, "ㅙ": 59, "ㅚ": 60, "ㅛ": 61, "ㅜ": 62, "ㅝ": 63, "ㅞ": 64, "ㅟ": 65, "ㅠ": 66, "ㅡ": 67, "ㅢ": 68, "ㅣ": 69, "οΌ": 70, "|": 1, "[UNK]": 71, "[PAD]": 72}
|