de-Rodrigo committed on
Commit
6174ab0
·
verified ·
1 Parent(s): b766d52

Training done

Browse files
Files changed (4) hide show
  1. README.md +3 -0
  2. added_tokens.json +4 -4
  3. tokenizer.json +4 -4
  4. tokenizer_config.json +4 -4
README.md CHANGED
@@ -1,3 +1,6 @@
 
 
 
1
  # DONUT Merit
2
 
3
  <a href="https://x.com/nearcyan/status/1706914605262684394">
 
1
+ ---
2
+ {}
3
+ ---
4
  # DONUT Merit
5
 
6
  <a href="https://x.com/nearcyan/status/1706914605262684394">
added_tokens.json CHANGED
@@ -2,8 +2,8 @@
2
  "</s_grade>": 57530,
3
  "</s_subject>": 57528,
4
  "</s_year_10>": 57532,
5
- "</s_year_11>": 57534,
6
- "</s_year_12>": 57536,
7
  "</s_year_9>": 57526,
8
  "<s_cord-v2>": 57537,
9
  "<s_grade>": 57529,
@@ -11,8 +11,8 @@
11
  "<s_subject>": 57527,
12
  "<s_synthdog>": 57524,
13
  "<s_year_10>": 57531,
14
- "<s_year_11>": 57533,
15
- "<s_year_12>": 57535,
16
  "<s_year_9>": 57525,
17
  "<sep/>": 57522
18
  }
 
2
  "</s_grade>": 57530,
3
  "</s_subject>": 57528,
4
  "</s_year_10>": 57532,
5
+ "</s_year_11>": 57536,
6
+ "</s_year_12>": 57534,
7
  "</s_year_9>": 57526,
8
  "<s_cord-v2>": 57537,
9
  "<s_grade>": 57529,
 
11
  "<s_subject>": 57527,
12
  "<s_synthdog>": 57524,
13
  "<s_year_10>": 57531,
14
+ "<s_year_11>": 57535,
15
+ "<s_year_12>": 57533,
16
  "<s_year_9>": 57525,
17
  "<sep/>": 57522
18
  }
tokenizer.json CHANGED
@@ -149,7 +149,7 @@
149
  },
150
  {
151
  "id": 57533,
152
- "content": "<s_year_11>",
153
  "single_word": false,
154
  "lstrip": false,
155
  "rstrip": false,
@@ -158,7 +158,7 @@
158
  },
159
  {
160
  "id": 57534,
161
- "content": "</s_year_11>",
162
  "single_word": false,
163
  "lstrip": false,
164
  "rstrip": false,
@@ -167,7 +167,7 @@
167
  },
168
  {
169
  "id": 57535,
170
- "content": "<s_year_12>",
171
  "single_word": false,
172
  "lstrip": false,
173
  "rstrip": false,
@@ -176,7 +176,7 @@
176
  },
177
  {
178
  "id": 57536,
179
- "content": "</s_year_12>",
180
  "single_word": false,
181
  "lstrip": false,
182
  "rstrip": false,
 
149
  },
150
  {
151
  "id": 57533,
152
+ "content": "<s_year_12>",
153
  "single_word": false,
154
  "lstrip": false,
155
  "rstrip": false,
 
158
  },
159
  {
160
  "id": 57534,
161
+ "content": "</s_year_12>",
162
  "single_word": false,
163
  "lstrip": false,
164
  "rstrip": false,
 
167
  },
168
  {
169
  "id": 57535,
170
+ "content": "<s_year_11>",
171
  "single_word": false,
172
  "lstrip": false,
173
  "rstrip": false,
 
176
  },
177
  {
178
  "id": 57536,
179
+ "content": "</s_year_11>",
180
  "single_word": false,
181
  "lstrip": false,
182
  "rstrip": false,
tokenizer_config.json CHANGED
@@ -129,7 +129,7 @@
129
  "special": false
130
  },
131
  "57533": {
132
- "content": "<s_year_11>",
133
  "lstrip": false,
134
  "normalized": true,
135
  "rstrip": false,
@@ -137,7 +137,7 @@
137
  "special": false
138
  },
139
  "57534": {
140
- "content": "</s_year_11>",
141
  "lstrip": false,
142
  "normalized": true,
143
  "rstrip": false,
@@ -145,7 +145,7 @@
145
  "special": false
146
  },
147
  "57535": {
148
- "content": "<s_year_12>",
149
  "lstrip": false,
150
  "normalized": true,
151
  "rstrip": false,
@@ -153,7 +153,7 @@
153
  "special": false
154
  },
155
  "57536": {
156
- "content": "</s_year_12>",
157
  "lstrip": false,
158
  "normalized": true,
159
  "rstrip": false,
 
129
  "special": false
130
  },
131
  "57533": {
132
+ "content": "<s_year_12>",
133
  "lstrip": false,
134
  "normalized": true,
135
  "rstrip": false,
 
137
  "special": false
138
  },
139
  "57534": {
140
+ "content": "</s_year_12>",
141
  "lstrip": false,
142
  "normalized": true,
143
  "rstrip": false,
 
145
  "special": false
146
  },
147
  "57535": {
148
+ "content": "<s_year_11>",
149
  "lstrip": false,
150
  "normalized": true,
151
  "rstrip": false,
 
153
  "special": false
154
  },
155
  "57536": {
156
+ "content": "</s_year_11>",
157
  "lstrip": false,
158
  "normalized": true,
159
  "rstrip": false,