Commit
·
5726c4f
1
Parent(s):
54f5d84
add tokenizer
Browse files
runs/Oct19_06-28-56_0e4cdf942af6/events.out.tfevents.1666161780.0e4cdf942af6.9735.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53abfe94201314a371ce848b8d9f8493e11f6cb9d7e92d44a150b99824ba2979
|
3 |
+
size 9206
|
special_tokens_map.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]"}
|
tokenizer_config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"unk_token": "[UNK]", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "[PAD]", "do_lower_case": false, "word_delimiter_token": "|", "replace_word_delimiter_char": " ", "tokenizer_class": "Wav2Vec2CTCTokenizer"}
|
vocab.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"\n": 0, "0": 2, "1": 3, "2": 4, "3": 5, "4": 6, "5": 7, "6": 8, "7": 9, "8": 10, "9": 11, "a": 12, "b": 13, "c": 14, "h": 15, "l": 16, "m": 17, "n": 18, "o": 19, "p": 20, "s": 21, "t": 22, "z": 23, "ㄱ": 24, "ㄲ": 25, "ㄴ": 26, "ㄵ": 27, "ㄶ": 28, "ㄷ": 29, "ㄸ": 30, "ㄹ": 31, "ㄺ": 32, "ㄻ": 33, "ㄼ": 34, "ㄾ": 35, "ㅀ": 36, "ㅁ": 37, "ㅂ": 38, "ㅃ": 39, "ㅄ": 40, "ㅅ": 41, "ㅆ": 42, "ㅇ": 43, "ㅈ": 44, "ㅉ": 45, "ㅊ": 46, "ㅋ": 47, "ㅌ": 48, "ㅍ": 49, "ㅎ": 50, "ㅏ": 51, "ㅐ": 52, "ㅑ": 53, "ㅒ": 54, "ㅓ": 55, "ㅔ": 56, "ㅕ": 57, "ㅖ": 58, "ㅗ": 59, "ㅘ": 60, "ㅙ": 61, "ㅚ": 62, "ㅛ": 63, "ㅜ": 64, "ㅝ": 65, "ㅞ": 66, "ㅟ": 67, "ㅠ": 68, "ㅡ": 69, "ㅢ": 70, "ㅣ": 71, "οΌ": 72, "|": 1, "[UNK]": 73, "[PAD]": 74}
|