jackJessada committed on
Commit
f337c0b
·
verified ·
1 Parent(s): 0a4104c

Upload folder using huggingface_hub

Browse files
Modelfile ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # ollama modelfile auto-generated by llamafactory
2
+
3
+ FROM .
4
+
5
+ TEMPLATE """<bos>{{ if .System }}{{ .System }}
6
+
7
+ {{ end }}{{ range .Messages }}{{ if eq .Role "user" }}<start_of_turn>user
8
+ {{ .Content }}<end_of_turn>
9
+ <start_of_turn>model
10
+ {{ else if eq .Role "assistant" }}{{ .Content }}<end_of_turn>
11
+ {{ end }}{{ end }}"""
12
+
13
+ PARAMETER stop "<eos>"
14
+ PARAMETER stop "<end_of_turn>"
15
+ PARAMETER num_ctx 4096
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "<image_soft_token>": 262144
3
+ }
config.json ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Gemma3ForConditionalGeneration"
4
+ ],
5
+ "boi_token_index": 255999,
6
+ "eoi_token_index": 256000,
7
+ "hidden_size": 5376,
8
+ "image_token_index": 262144,
9
+ "initializer_range": 0.02,
10
+ "mm_tokens_per_image": 256,
11
+ "model_type": "gemma3",
12
+ "text_config": {
13
+ "attention_bias": false,
14
+ "attention_dropout": 0.0,
15
+ "attn_logit_softcapping": null,
16
+ "cache_implementation": "hybrid",
17
+ "final_logit_softcapping": null,
18
+ "head_dim": 128,
19
+ "hidden_activation": "gelu_pytorch_tanh",
20
+ "hidden_size": 5376,
21
+ "initializer_range": 0.02,
22
+ "intermediate_size": 21504,
23
+ "max_position_embeddings": 131072,
24
+ "model_type": "gemma3_text",
25
+ "num_attention_heads": 32,
26
+ "num_hidden_layers": 62,
27
+ "num_key_value_heads": 16,
28
+ "query_pre_attn_scalar": 168,
29
+ "rms_norm_eps": 1e-06,
30
+ "rope_local_base_freq": 10000.0,
31
+ "rope_scaling": {
32
+ "factor": 8.0,
33
+ "rope_type": "linear"
34
+ },
35
+ "rope_theta": 1000000.0,
36
+ "sliding_window": 1024,
37
+ "sliding_window_pattern": 6,
38
+ "torch_dtype": "float32",
39
+ "use_cache": false,
40
+ "vocab_size": 262208
41
+ },
42
+ "torch_dtype": "float32",
43
+ "transformers_version": "4.51.0.dev0",
44
+ "use_cache": true,
45
+ "vision_config": {
46
+ "attention_dropout": 0.0,
47
+ "hidden_act": "gelu_pytorch_tanh",
48
+ "hidden_size": 1152,
49
+ "image_size": 896,
50
+ "intermediate_size": 4304,
51
+ "layer_norm_eps": 1e-06,
52
+ "model_type": "siglip_vision_model",
53
+ "num_attention_heads": 16,
54
+ "num_channels": 3,
55
+ "num_hidden_layers": 27,
56
+ "patch_size": 14,
57
+ "torch_dtype": "float32",
58
+ "vision_use_head": false
59
+ }
60
+ }
generation_config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 2,
3
+ "cache_implementation": "hybrid",
4
+ "do_sample": true,
5
+ "eos_token_id": 106,
6
+ "pad_token_id": 0,
7
+ "top_k": 64,
8
+ "top_p": 0.95,
9
+ "transformers_version": "4.51.0.dev0",
10
+ "forced_eos_token_id": 106,
11
+ "length_penalty": -0.8,
12
+ "repetition_penalty": 1.1,
13
+ "temperature": 0.5,
14
+ "num_beams": 1,
15
+ "logit_bias": {
16
+ "106": 7.5
17
+ }
18
+
19
+ }
model-00001-of-00005.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c84886fb6864f09bcd61f31ae2cdff868712ce21265b10ebb0076a408ab66fd3
3
+ size 23978903728
model-00002-of-00005.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a45c1810df364638cfcd0385eb4783cb568535e6398573eccc5c347650a3267e
3
+ size 23716887688
model-00003-of-00005.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:388735b9af45710c4f3a23b3cbc69bba4bd6fdecd86a3eb13acc54e9c39bcdd5
3
+ size 23584765560
model-00004-of-00005.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bcbfa0e620917a76e138a1e3a40573fd822da50d1fd7c592fd62f2318690930
3
+ size 23849095088
model-00005-of-00005.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67594b7e4a4c0cfaea539351885d119b118b161b06c0c6c45a98e8ac30df0eff
3
+ size 20238663280
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
preprocessor_config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_convert_rgb": null,
3
+ "do_normalize": true,
4
+ "do_pan_and_scan": null,
5
+ "do_rescale": true,
6
+ "do_resize": true,
7
+ "image_mean": [
8
+ 0.5,
9
+ 0.5,
10
+ 0.5
11
+ ],
12
+ "image_processor_type": "Gemma3ImageProcessor",
13
+ "image_seq_length": 256,
14
+ "image_std": [
15
+ 0.5,
16
+ 0.5,
17
+ 0.5
18
+ ],
19
+ "pan_and_scan_max_num_crops": null,
20
+ "pan_and_scan_min_crop_size": null,
21
+ "pan_and_scan_min_ratio_to_activate": null,
22
+ "processor_class": "Gemma3Processor",
23
+ "resample": 2,
24
+ "rescale_factor": 0.00392156862745098,
25
+ "size": {
26
+ "height": 896,
27
+ "width": 896
28
+ }
29
+ }
processor_config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "image_seq_length": 256,
3
+ "processor_class": "Gemma3Processor"
4
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ {
4
+ "content": "<end_of_turn>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false
9
+ }
10
+ ],
11
+ "boi_token": "<start_of_image>",
12
+ "bos_token": {
13
+ "content": "<bos>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false
18
+ },
19
+ "eoi_token": "<end_of_image>",
20
+ "eos_token": {
21
+ "content": "<eos>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false
26
+ },
27
+ "image_token": "<image_soft_token>",
28
+ "pad_token": {
29
+ "content": "<pad>",
30
+ "lstrip": false,
31
+ "normalized": false,
32
+ "rstrip": false,
33
+ "single_word": false
34
+ },
35
+ "unk_token": {
36
+ "content": "<unk>",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false
41
+ }
42
+ }
thai_space_tokens.json ADDED
@@ -0,0 +1,564 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "146159": " ง่าย",
3
+ "75315": " รู้",
4
+ "222431": " ราช",
5
+ "226080": " ราศี",
6
+ "126170": " เจอ",
7
+ "174982": " แค",
8
+ "85657": " พระ",
9
+ "105998": " เดี๋ยว",
10
+ "194671": " หัด",
11
+ "116062": " หาก",
12
+ "171961": " กราบ",
13
+ "42503": " เส",
14
+ "130481": " ใคร",
15
+ "27757": " ซ",
16
+ "190280": " ทอง",
17
+ "133337": " คํา",
18
+ "136040": " เฮ",
19
+ "111151": " หลัก",
20
+ "136835": " อื่น",
21
+ "110088": " อี",
22
+ "36031": " ผม",
23
+ "74551": " เขา",
24
+ "63348": " มั้ย",
25
+ "136192": " เดิม",
26
+ "92411": " พบ",
27
+ "128279": " ธ",
28
+ "152421": " ฟัง",
29
+ "208960": " หน่อย",
30
+ "164876": " ไอ้",
31
+ "93283": " ภาพ",
32
+ "140102": " ราคา",
33
+ "228169": " ประจํา",
34
+ "111706": " ดัง",
35
+ "108713": " แก",
36
+ "153882": " รี",
37
+ "169840": " เดือน",
38
+ "182019": " แปร",
39
+ "177679": " รถ",
40
+ "196676": " กำ",
41
+ "102747": " กํา",
42
+ "209224": " ปลา",
43
+ "19614": " ด",
44
+ "172128": " ใหญ่",
45
+ "22954": " อย",
46
+ "46940": " เนี่ย",
47
+ "232492": " หลังจาก",
48
+ "4307": " ค",
49
+ "31009": " กับ",
50
+ "79669": " ตอน",
51
+ "189213": " ชั่วโมง",
52
+ "27203": " กัน",
53
+ "229460": " เหมาะ",
54
+ "123953": " เปิด",
55
+ "78046": " นั้น",
56
+ "179031": " ชี",
57
+ "27396": " วัน",
58
+ "27657": " เข",
59
+ "176191": " จุด",
60
+ "38344": " มัน",
61
+ "194812": " จังหวัด",
62
+ "74714": " ถึง",
63
+ "32327": " คน",
64
+ "218537": " เหน",
65
+ "216063": " ฟรี",
66
+ "227901": " ชีวิต",
67
+ "79763": " ศ",
68
+ "29662": " ประ",
69
+ "199522": " แจ",
70
+ "109952": " ถูก",
71
+ "183169": " แสดง",
72
+ "87279": " เจ้า",
73
+ "218614": " นอน",
74
+ "127604": " ไทย",
75
+ "183726": " เรือ",
76
+ "107365": " ลง",
77
+ "137141": " บวก",
78
+ "200873": " ปุ่ม",
79
+ "200620": " วั",
80
+ "136671": " เพื่อน",
81
+ "121982": " เรียก",
82
+ "66626": " คร",
83
+ "164330": " กรรม",
84
+ "104642": " ละ",
85
+ "170509": " ทีม",
86
+ "207095": " ศูนย์",
87
+ "115135": " คู่",
88
+ "199229": " อุ",
89
+ "82454": " บาง",
90
+ "156232": " คิด",
91
+ "13793": " ก็",
92
+ "65524": " ลูก",
93
+ "78052": " ค่า",
94
+ "165978": " อนุ",
95
+ "213459": " ใด",
96
+ "73529": " ใหม่",
97
+ "16388": " ม",
98
+ "149873": " ขนาด",
99
+ "158057": " ล่ะ",
100
+ "20277": " แล้ว",
101
+ "93313": " เรีย",
102
+ "103111": " เดียว",
103
+ "156572": " สุด",
104
+ "150639": " คลิก",
105
+ "168722": " จน",
106
+ "167081": " กิน",
107
+ "64825": " ปี",
108
+ "106709": " รา",
109
+ "88811": " สําหรับ",
110
+ "12212": " ท",
111
+ "189330": " หมาย",
112
+ "236691": " สง",
113
+ "147329": " กู",
114
+ "194002": " ปก",
115
+ "70846": " ขึ้น",
116
+ "130682": " หนึ่ง",
117
+ "130196": " เฉ",
118
+ "155620": " สาว",
119
+ "156707": " แห่ง",
120
+ "93607": " นั่น",
121
+ "23476": " ป",
122
+ "175697": " เพียง",
123
+ "97624": " กด",
124
+ "109374": " โอเค",
125
+ "127596": " ส่ง",
126
+ "200625": " เหรอ",
127
+ "53249": " เพราะ",
128
+ "83068": " จำ",
129
+ "51944": " เช",
130
+ "172499": " คง",
131
+ "176313": " สอบ",
132
+ "150149": " พวก",
133
+ "172809": " เนื่อง",
134
+ "25649": " เพ",
135
+ "64925": " อ่ะ",
136
+ "107905": " หลัง",
137
+ "132460": " ดาว",
138
+ "234076": " ถนน",
139
+ "83651": " รับ",
140
+ "127592": " แบ่ง",
141
+ "90761": " ตั้ง",
142
+ "120198": " หัว",
143
+ "105792": " เต",
144
+ "229381": " ชอบ",
145
+ "144230": " จํานวน",
146
+ "162660": " ภาษา",
147
+ "112086": " แห",
148
+ "207268": " กลุ่ม",
149
+ "38902": " เม",
150
+ "195767": " ณ",
151
+ "211662": " พิ",
152
+ "120897": " ห้อง",
153
+ "100800": " น้อย",
154
+ "231875": " งวด",
155
+ "109313": " ชื่อ",
156
+ "112822": " รัก",
157
+ "130116": " แม",
158
+ "222079": " บุ",
159
+ "176389": " พิจ",
160
+ "61497": " อัน",
161
+ "48250": " ซึ่ง",
162
+ "72596": " บ้าน",
163
+ "210753": " แอป",
164
+ "66826": " เป",
165
+ "68225": " ดี",
166
+ "33639": " ค่ะ",
167
+ "65380": " หา",
168
+ "105009": " ไว้",
169
+ "233979": " พิจิก",
170
+ "131043": " วิธี",
171
+ "115180": " เปลี่ยน",
172
+ "45079": " ทํา",
173
+ "196479": " รอบ",
174
+ "61472": " ใช้",
175
+ "209262": " สัก",
176
+ "103805": " ใจ",
177
+ "79106": " ฮะ",
178
+ "209984": " หนังสือ",
179
+ "196924": " ดิ",
180
+ "10265": " ห",
181
+ "207418": " จง",
182
+ "20649": " มี",
183
+ "208643": " หน่วย",
184
+ "29043": " ตัว",
185
+ "85705": " ฝ",
186
+ "16798": " นี้",
187
+ "123823": " หมด",
188
+ "145941": " ประกอบ",
189
+ "173008": " จด",
190
+ "45272": " ข้อ",
191
+ "234986": " ไข",
192
+ "182165": " พัน",
193
+ "198064": " หนู",
194
+ "17122": " ร",
195
+ "91623": " คลิป",
196
+ "45970": " นัก",
197
+ "51443": " ต้อง",
198
+ "123291": " ประเภท",
199
+ "226410": " คอม",
200
+ "143231": " โปร",
201
+ "163991": " ใบ",
202
+ "117233": " เอ่อ",
203
+ "226910": " อำ",
204
+ "82087": " สม",
205
+ "131870": " กว่า",
206
+ "23474": " ย",
207
+ "235303": " ทด",
208
+ "14881": " มา",
209
+ "216397": " ร่วม",
210
+ "181781": " เพิ่ม",
211
+ "223221": " เชื่อ",
212
+ "196553": " แพ",
213
+ "166864": " จัก",
214
+ "122656": " เล่น",
215
+ "177432": " เฟ",
216
+ "181054": " ชาว",
217
+ "180740": " ไหม",
218
+ "52723": " เนาะ",
219
+ "169153": " ผ่าน",
220
+ "195663": " ตุ",
221
+ "82257": " ใส่",
222
+ "54046": " อย่าง",
223
+ "83194": " ทาง",
224
+ "52864": " ครู",
225
+ "46282": " อะไร",
226
+ "214400": " เฉล",
227
+ "54374": " หน้า",
228
+ "59799": " โอ",
229
+ "141676": " ลอง",
230
+ "108264": " พา",
231
+ "134698": " สร้าง",
232
+ "5363": " ก",
233
+ "57917": " ก่อน",
234
+ "102683": " ถาม",
235
+ "153392": " น่ะ",
236
+ "109053": " กร",
237
+ "151692": " เป้า",
238
+ "119969": " แม่",
239
+ "97532": " เครื่อง",
240
+ "94658": " คณิต",
241
+ "175533": " อยาก",
242
+ "116873": " ชั้น",
243
+ "211162": " อิ",
244
+ "211428": " สิน",
245
+ "181437": " คูณ",
246
+ "78177": " สํา",
247
+ "203098": " สมการ",
248
+ "55632": " ฮ",
249
+ "104606": " แท",
250
+ "90262": " มาก",
251
+ "219664": " นาที",
252
+ "24053": " ถ",
253
+ "166968": " ผ้า",
254
+ "22675": " เล",
255
+ "216718": " กี่",
256
+ "190608": " ข้าง",
257
+ "71608": " อาจ",
258
+ "47416": " วิ",
259
+ "208917": " เอก",
260
+ "149905": " ประเทศ",
261
+ "116957": " ช่วย",
262
+ "123225": " เขียน",
263
+ "128295": " ประก",
264
+ "223440": " ไล",
265
+ "121255": " จึง",
266
+ "159012": " นับ",
267
+ "112408": " แน",
268
+ "83516": " ฉ",
269
+ "157963": " ฝึก",
270
+ "139153": " สะ",
271
+ "135819": " กําลัง",
272
+ "65601": " ทั้ง",
273
+ "69077": " น้อง",
274
+ "218493": " เตรียม",
275
+ "185962": " นา",
276
+ "31701": " คือ",
277
+ "20271": " ได้",
278
+ "196499": " ลํา",
279
+ "80450": " ด้าน",
280
+ "90798": " ชม",
281
+ "42328": " เก",
282
+ "81612": " ทำ",
283
+ "19856": " ล",
284
+ "172305": " ต้องการ",
285
+ "83289": " กระ",
286
+ "182238": " สา",
287
+ "175278": " นอกจาก",
288
+ "56205": " ง",
289
+ "49126": " ทุก",
290
+ "230312": " หยุด",
291
+ "157131": " ตัด",
292
+ "18525": " ผ",
293
+ "202178": " มอง",
294
+ "6228": " แ",
295
+ "86479": " สูตร",
296
+ "115332": " ต้น",
297
+ "42650": " จาก",
298
+ "137546": " กลับ",
299
+ "9189": " นะ",
300
+ "130962": " อ่าน",
301
+ "95944": " เกิด",
302
+ "192715": " หมู่",
303
+ "195449": " เคย",
304
+ "220526": " กรณี",
305
+ "86851": " เห็น",
306
+ "229371": " เดิน",
307
+ "233067": " อิน",
308
+ "229711": " เวอร์ชั่น",
309
+ "226930": " แก้",
310
+ "11603": " ที่",
311
+ "47716": " เอ",
312
+ "23192": " ไป",
313
+ "33719": " เด",
314
+ "109098": " สำหรับ",
315
+ "186725": " ยาก",
316
+ "227259": " กี้",
317
+ "63168": " สวัสดี",
318
+ "57642": " แบบ",
319
+ "57114": " นี่",
320
+ "120696": " ต่าง",
321
+ "152936": " ยาว",
322
+ "15912": " จะ",
323
+ "175151": " ระบบ",
324
+ "163558": " ไหร่",
325
+ "199468": " เมือง",
326
+ "113298": " คณิตศาสตร์",
327
+ "40802": " ดู",
328
+ "196503": " บริษัท",
329
+ "227312": " รวมถึง",
330
+ "7276": " อ",
331
+ "55953": " เว",
332
+ "27831": " ให้",
333
+ "188998": " มิถุนายน",
334
+ "68252": " ต่อ",
335
+ "8264": " ส",
336
+ "85138": " ใช่",
337
+ "223286": " เงี้ย",
338
+ "229868": " แชร์",
339
+ "199022": " ไม่มี",
340
+ "192629": " จํา",
341
+ "31072": " หน",
342
+ "100177": " บริ",
343
+ "171668": " เกม",
344
+ "214683": " ออนไลน์",
345
+ "217590": " นาง",
346
+ "192645": " แต",
347
+ "100612": " นํา",
348
+ "56583": " อ่า",
349
+ "230779": " ตำ",
350
+ "24366": " ไม่",
351
+ "116588": " เหมือน",
352
+ "224328": " แยก",
353
+ "63429": " ไฟ",
354
+ "148135": " น้ำ",
355
+ "75662": " พร้อม",
356
+ "111034": " ประมาณ",
357
+ "210960": " ดังนั้น",
358
+ "114885": " จำกัด",
359
+ "199073": " ฉาก",
360
+ "215492": " รุ่น",
361
+ "228266": " สาม",
362
+ "107374": " ราย",
363
+ "155325": " เศษ",
364
+ "190499": " ขณะ",
365
+ "222019": " สิง",
366
+ "52364": " ผู้",
367
+ "208174": " เวอร์",
368
+ "133133": " เศ",
369
+ "122301": " ระยะ",
370
+ "7749": " ไ",
371
+ "125051": " มุม",
372
+ "235343": " ขาย",
373
+ "134379": " บน",
374
+ "151258": " ไม",
375
+ "206366": " ช่อง",
376
+ "81825": " ผล",
377
+ "138311": " เออ",
378
+ "211415": " ขั้น",
379
+ "86627": " สำ",
380
+ "89111": " สามารถ",
381
+ "146788": " หาร",
382
+ "37782": " หรือ",
383
+ "22301": " ว่า",
384
+ "156239": " เด้อ",
385
+ "234663": " แถม",
386
+ "44216": " เข้า",
387
+ "108492": " ฟ้า",
388
+ "3157": " เ",
389
+ "119481": " ไง",
390
+ "144338": " สืบค้นเมื่อ",
391
+ "39759": " โดย",
392
+ "16450": " ข",
393
+ "110554": " สี",
394
+ "4838": " น",
395
+ "20007": " เรา",
396
+ "99997": " ติด",
397
+ "37098": " อยู่",
398
+ "207224": " ลด",
399
+ "235157": " ครอง",
400
+ "224056": " ตุลาคม",
401
+ "56764": " กล",
402
+ "200643": " เต็ม",
403
+ "234992": " สาย",
404
+ "158420": " รอง",
405
+ "12621": " พ",
406
+ "33347": " เรียน",
407
+ "22386": " ๆ",
408
+ "35097": " เน",
409
+ "75629": " เท่า",
410
+ "70342": " ท่าน",
411
+ "19302": " ช",
412
+ "175304": " แอ",
413
+ "103762": " ตอบ",
414
+ "150927": " โอ้",
415
+ "49107": " เรื่อง",
416
+ "210042": " ร้าน",
417
+ "227462": " ควร",
418
+ "156589": " ช่วง",
419
+ "109438": " หลาย",
420
+ "42106": " ใ",
421
+ "144695": " บ่",
422
+ "88887": " พอ",
423
+ "143072": " สืบค้น",
424
+ "49283": " เห",
425
+ "142153": " ล้าน",
426
+ "185996": " แนว",
427
+ "94745": " รูป",
428
+ "68791": " คลิ",
429
+ "210925": " จำนวน",
430
+ "69916": " เบ",
431
+ "18796": " การ",
432
+ "153012": " นิ",
433
+ "152321": " โม",
434
+ "175184": " หย",
435
+ "50530": " อา",
436
+ "124310": " มือ",
437
+ "31732": " แต่",
438
+ "62304": " อีก",
439
+ "115918": " แรก",
440
+ "183060": " ดวง",
441
+ "130652": " มิ",
442
+ "173947": " เหลือ",
443
+ "58777": " ระ",
444
+ "185149": " เก็บ",
445
+ "78093": " ตรง",
446
+ "53376": " พี่",
447
+ "60877": " เอา",
448
+ "77840": " บอก",
449
+ "148487": " ทำให้",
450
+ "225158": " โจทย์",
451
+ "186439": " เธอ",
452
+ "171647": " อืม",
453
+ "151247": " มูล",
454
+ "235802": " เนื่องจาก",
455
+ "208592": " โร",
456
+ "162837": " เลือก",
457
+ "188460": " จับ",
458
+ "10249": " ครับ",
459
+ "62685": " เมื่อ",
460
+ "129480": " เค",
461
+ "45878": " ฟ",
462
+ "230176": " คำ",
463
+ "70630": " หม",
464
+ "155813": " แนะ",
465
+ "78357": " ที",
466
+ "131814": " นึง",
467
+ "83498": " ตาม",
468
+ "52499": " คุณ",
469
+ "169806": " เกี่ยว",
470
+ "133824": " ตา",
471
+ "113932": " แรง",
472
+ "94099": " สน",
473
+ "220048": " เมตร",
474
+ "16262": " ว",
475
+ "97070": " บาท",
476
+ "174669": " เก็",
477
+ "94862": " รวม",
478
+ "43122": " เร",
479
+ "48435": " ด้วย",
480
+ "189523": " พระเจ้า",
481
+ "130714": " สื",
482
+ "147125": " จริง",
483
+ "9879": " ต",
484
+ "196238": " วัด",
485
+ "97452": " สอน",
486
+ "69414": " ขอ",
487
+ "135022": " สิ่ง",
488
+ "163171": " เง",
489
+ "188579": " เสียง",
490
+ "151482": " บท",
491
+ "201170": " อาท",
492
+ "80544": " เวลา",
493
+ "213124": " แล",
494
+ "19304": " ใน",
495
+ "158428": " พื้น",
496
+ "127257": " อย่า",
497
+ "122669": " โรง",
498
+ "114140": " เซ",
499
+ "89317": " เด็ก",
500
+ "15515": " บ",
501
+ "17555": " เป็น",
502
+ "112763": " สิ",
503
+ "131023": " ครั้ง",
504
+ "117795": " น้ํา",
505
+ "77777": " งาน",
506
+ "178424": " ยก",
507
+ "203932": " สถาน",
508
+ "117461": " เย",
509
+ "14675": " โ",
510
+ "166497": " คว",
511
+ "109145": " เริ่ม",
512
+ "49804": " เท",
513
+ "163711": " เสร็จ",
514
+ "23327": " ของ",
515
+ "226836": " ร้อย",
516
+ "9321": " จ",
517
+ "78135": " สู",
518
+ "137046": " รอ",
519
+ "162777": " คะแนน",
520
+ "55120": " ส่วน",
521
+ "64401": " ออก",
522
+ "99307": " เช่น",
523
+ "189437": " ตาย",
524
+ "198104": " บ้าง",
525
+ "47860": " เพื่อ",
526
+ "79107": " เลข",
527
+ "49706": " ยัง",
528
+ "230456": " ด่า",
529
+ "18685": " คะ",
530
+ "221187": " อังกฤษ",
531
+ "38364": " เลย",
532
+ "225512": " เยอะ",
533
+ "102469": " เหล",
534
+ "191086": " แทน",
535
+ "80482": " วิชา",
536
+ "163980": " ชุด",
537
+ "135638": " ขวด",
538
+ "114412": " ไหน",
539
+ "163577": " ลักษณะ",
540
+ "135429": " ไฟล์",
541
+ "172483": " กล่าว",
542
+ "213077": " กม",
543
+ "18389": " และ",
544
+ "118423": " เส้น",
545
+ "108666": " พูด",
546
+ "160186": " เนื้อ",
547
+ "164190": " เงิน",
548
+ "138752": " ไอ",
549
+ "212038": " เด่น",
550
+ "56023": " ถ้า",
551
+ "116435": " จัด",
552
+ "126557": " เอง",
553
+ "215573": " เหตุ",
554
+ "118771": " อาจารย์",
555
+ "51564": " เจ",
556
+ "231876": " นิด",
557
+ "126099": " สนาม",
558
+ "219542": " อายุ",
559
+ "46979": " ความ",
560
+ "56146": " หล",
561
+ "172046": " แปล",
562
+ "105574": " น่า",
563
+ "128001": " นาย"
564
+ }
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1299c11d7cf632ef3b4e11937501358ada021bbdf7c47638d13c0ee982f2e79c
3
+ size 4689074
tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff