Ben10x committed on
Commit
0e5edd1
·
verified ·
1 Parent(s): 78e15bb

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -47,144 +47,226 @@
47
  "gradient_checkpointing": false,
48
  "hidden_size": 2048,
49
  "id2label": {
50
- "0": "B-T048",
51
- "1": "B-T047",
52
- "2": "I-T074",
53
- "3": "I-T170",
54
- "4": "I-O",
55
- "5": "I-T033",
56
- "6": "B-T091",
57
- "7": "B-T037",
58
- "8": "I-T020",
59
- "9": "B-T082",
60
- "10": "B-T074",
61
- "11": "B-T092",
62
- "12": "I-T091",
63
- "13": "I-T092",
64
- "14": "B-T116",
65
- "15": "B-T169",
66
- "16": "I-T046",
67
- "17": "I-T116",
68
- "18": "I-T191",
69
- "19": "I-T022",
70
- "20": "I-T028",
71
- "21": "I-T019",
72
- "22": "B-T005",
73
- "23": "B-T170",
74
- "24": "B-T168",
75
  "25": "I-T168",
76
- "26": "I-T031",
77
- "27": "I-T129",
78
- "28": "B-T031",
79
- "29": "I-T103",
80
- "30": "B-T019",
81
- "31": "B-T129",
82
- "32": "B-T058",
83
- "33": "B-O",
84
- "34": "B-T190",
85
- "35": "B-T204",
86
- "36": "I-T184",
87
- "37": "B-T191",
88
- "38": "B-T022",
89
- "39": "B-T201",
90
- "40": "I-T058",
91
- "41": "B-T046",
92
- "42": "B-T098",
93
- "43": "I-T201",
94
- "44": "I-T005",
95
- "45": "I-T037",
96
- "46": "B-T033",
97
- "47": "I-T062",
98
- "48": "I-T097",
99
- "49": "B-T184",
100
- "50": "B-T028",
101
- "51": "I-T038",
102
- "52": "I-T204",
103
  "53": "I-T047",
104
- "54": "I-T082",
105
- "55": "I-T098",
106
- "56": "B-T007",
107
- "57": "B-T038",
108
- "58": "B-T097",
109
- "59": "I-T048",
110
- "60": "I-T017",
111
- "61": "B-T020",
112
- "62": "B-T062",
113
- "63": "O",
114
- "64": "I-T007",
115
- "65": "B-T103",
116
- "66": "B-T017"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
117
  },
118
  "initializer_range": 0.02,
119
  "intermediate_size": null,
120
  "label2id": {
121
- "B-O": 33,
122
- "B-T005": 22,
123
- "B-T007": 56,
124
- "B-T017": 66,
125
- "B-T019": 30,
126
- "B-T020": 61,
127
- "B-T022": 38,
128
- "B-T028": 50,
129
- "B-T031": 28,
130
- "B-T033": 46,
131
- "B-T037": 7,
132
- "B-T038": 57,
133
- "B-T046": 41,
134
- "B-T047": 1,
135
- "B-T048": 0,
136
- "B-T058": 32,
137
- "B-T062": 62,
138
- "B-T074": 10,
139
- "B-T082": 9,
140
- "B-T091": 6,
141
- "B-T092": 11,
142
- "B-T097": 58,
143
- "B-T098": 42,
144
- "B-T103": 65,
145
- "B-T116": 14,
146
- "B-T129": 31,
147
- "B-T168": 24,
148
- "B-T169": 15,
149
- "B-T170": 23,
150
- "B-T184": 49,
151
- "B-T190": 34,
152
- "B-T191": 37,
153
- "B-T201": 39,
154
- "B-T204": 35,
155
- "I-O": 4,
156
- "I-T005": 44,
157
- "I-T007": 64,
158
- "I-T017": 60,
159
- "I-T019": 21,
160
- "I-T020": 8,
161
- "I-T022": 19,
162
- "I-T028": 20,
163
- "I-T031": 26,
164
- "I-T033": 5,
165
- "I-T037": 45,
166
- "I-T038": 51,
167
- "I-T046": 16,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
168
  "I-T047": 53,
169
- "I-T048": 59,
170
- "I-T058": 40,
171
- "I-T062": 47,
172
- "I-T074": 2,
173
- "I-T082": 54,
174
- "I-T091": 12,
175
- "I-T092": 13,
176
- "I-T097": 48,
177
- "I-T098": 55,
178
- "I-T103": 29,
179
- "I-T116": 17,
180
- "I-T129": 27,
 
 
 
 
 
 
 
 
181
  "I-T168": 25,
182
- "I-T170": 3,
183
- "I-T184": 36,
184
- "I-T191": 18,
185
- "I-T201": 43,
186
- "I-T204": 52,
187
- "O": 63
 
188
  },
189
  "layer_norm_epsilon": 1e-05,
190
  "max_position_embeddings": 2048,
 
47
  "gradient_checkpointing": false,
48
  "hidden_size": 2048,
49
  "id2label": {
50
+ "0": "B-T081",
51
+ "1": "B-T037",
52
+ "2": "I-T020",
53
+ "3": "B-T020",
54
+ "4": "I-T026",
55
+ "5": "B-T170",
56
+ "6": "B-T070",
57
+ "7": "I-T170",
58
+ "8": "B-T028",
59
+ "9": "I-T082",
60
+ "10": "B-T017",
61
+ "11": "I-T044",
62
+ "12": "B-T196",
63
+ "13": "I-T091",
64
+ "14": "B-T025",
65
+ "15": "I-T058",
66
+ "16": "B-T024",
67
+ "17": "B-T033",
68
+ "18": "B-T129",
69
+ "19": "I-T037",
70
+ "20": "I-T074",
71
+ "21": "B-T041",
72
+ "22": "B-T191",
73
+ "23": "B-T022",
74
+ "24": "I-T007",
75
  "25": "I-T168",
76
+ "26": "I-T043",
77
+ "27": "I-T098",
78
+ "28": "B-T048",
79
+ "29": "B-T098",
80
+ "30": "B-T082",
81
+ "31": "I-T033",
82
+ "32": "B-T091",
83
+ "33": "I-T190",
84
+ "34": "B-T045",
85
+ "35": "I-T097",
86
+ "36": "B-T167",
87
+ "37": "I-T045",
88
+ "38": "B-T023",
89
+ "39": "I-T109",
90
+ "40": "B-T080",
91
+ "41": "B-T097",
92
+ "42": "I-T039",
93
+ "43": "B-T043",
94
+ "44": "B-T116",
95
+ "45": "I-T129",
96
+ "46": "B-T092",
97
+ "47": "B-T026",
98
+ "48": "I-T041",
99
+ "49": "B-T040",
100
+ "50": "B-T074",
101
+ "51": "B-T062",
102
+ "52": "I-T025",
103
  "53": "I-T047",
104
+ "54": "B-T201",
105
+ "55": "B-T109",
106
+ "56": "B-T031",
107
+ "57": "B-T197",
108
+ "58": "I-T005",
109
+ "59": "I-T062",
110
+ "60": "B-T063",
111
+ "61": "B-T114",
112
+ "62": "B-T038",
113
+ "63": "B-T058",
114
+ "64": "I-T121",
115
+ "65": "I-T092",
116
+ "66": "I-T048",
117
+ "67": "I-T204",
118
+ "68": "I-T191",
119
+ "69": "I-T201",
120
+ "70": "B-T123",
121
+ "71": "I-T038",
122
+ "72": "B-T104",
123
+ "73": "O",
124
+ "74": "I-T017",
125
+ "75": "I-T114",
126
+ "76": "I-T019",
127
+ "77": "I-T022",
128
+ "78": "I-T031",
129
+ "79": "B-T007",
130
+ "80": "I-T063",
131
+ "81": "B-T039",
132
+ "82": "B-T047",
133
+ "83": "B-T103",
134
+ "84": "I-T046",
135
+ "85": "I-T116",
136
+ "86": "I-T024",
137
+ "87": "B-T059",
138
+ "88": "B-T204",
139
+ "89": "I-T125",
140
+ "90": "B-T121",
141
+ "91": "B-T044",
142
+ "92": "B-T184",
143
+ "93": "B-T190",
144
+ "94": "I-T028",
145
+ "95": "I-T023",
146
+ "96": "B-T168",
147
+ "97": "B-T046",
148
+ "98": "B-T019",
149
+ "99": "B-T125",
150
+ "100": "I-T184",
151
+ "101": "I-T059",
152
+ "102": "B-T169",
153
+ "103": "I-T070",
154
+ "104": "B-T131",
155
+ "105": "I-T167",
156
+ "106": "I-T103",
157
+ "107": "B-T005"
158
  },
159
  "initializer_range": 0.02,
160
  "intermediate_size": null,
161
  "label2id": {
162
+ "B-T005": 107,
163
+ "B-T007": 79,
164
+ "B-T017": 10,
165
+ "B-T019": 98,
166
+ "B-T020": 3,
167
+ "B-T022": 23,
168
+ "B-T023": 38,
169
+ "B-T024": 16,
170
+ "B-T025": 14,
171
+ "B-T026": 47,
172
+ "B-T028": 8,
173
+ "B-T031": 56,
174
+ "B-T033": 17,
175
+ "B-T037": 1,
176
+ "B-T038": 62,
177
+ "B-T039": 81,
178
+ "B-T040": 49,
179
+ "B-T041": 21,
180
+ "B-T043": 43,
181
+ "B-T044": 91,
182
+ "B-T045": 34,
183
+ "B-T046": 97,
184
+ "B-T047": 82,
185
+ "B-T048": 28,
186
+ "B-T058": 63,
187
+ "B-T059": 87,
188
+ "B-T062": 51,
189
+ "B-T063": 60,
190
+ "B-T070": 6,
191
+ "B-T074": 50,
192
+ "B-T080": 40,
193
+ "B-T081": 0,
194
+ "B-T082": 30,
195
+ "B-T091": 32,
196
+ "B-T092": 46,
197
+ "B-T097": 41,
198
+ "B-T098": 29,
199
+ "B-T103": 83,
200
+ "B-T104": 72,
201
+ "B-T109": 55,
202
+ "B-T114": 61,
203
+ "B-T116": 44,
204
+ "B-T121": 90,
205
+ "B-T123": 70,
206
+ "B-T125": 99,
207
+ "B-T129": 18,
208
+ "B-T131": 104,
209
+ "B-T167": 36,
210
+ "B-T168": 96,
211
+ "B-T169": 102,
212
+ "B-T170": 5,
213
+ "B-T184": 92,
214
+ "B-T190": 93,
215
+ "B-T191": 22,
216
+ "B-T196": 12,
217
+ "B-T197": 57,
218
+ "B-T201": 54,
219
+ "B-T204": 88,
220
+ "I-T005": 58,
221
+ "I-T007": 24,
222
+ "I-T017": 74,
223
+ "I-T019": 76,
224
+ "I-T020": 2,
225
+ "I-T022": 77,
226
+ "I-T023": 95,
227
+ "I-T024": 86,
228
+ "I-T025": 52,
229
+ "I-T026": 4,
230
+ "I-T028": 94,
231
+ "I-T031": 78,
232
+ "I-T033": 31,
233
+ "I-T037": 19,
234
+ "I-T038": 71,
235
+ "I-T039": 42,
236
+ "I-T041": 48,
237
+ "I-T043": 26,
238
+ "I-T044": 11,
239
+ "I-T045": 37,
240
+ "I-T046": 84,
241
  "I-T047": 53,
242
+ "I-T048": 66,
243
+ "I-T058": 15,
244
+ "I-T059": 101,
245
+ "I-T062": 59,
246
+ "I-T063": 80,
247
+ "I-T070": 103,
248
+ "I-T074": 20,
249
+ "I-T082": 9,
250
+ "I-T091": 13,
251
+ "I-T092": 65,
252
+ "I-T097": 35,
253
+ "I-T098": 27,
254
+ "I-T103": 106,
255
+ "I-T109": 39,
256
+ "I-T114": 75,
257
+ "I-T116": 85,
258
+ "I-T121": 64,
259
+ "I-T125": 89,
260
+ "I-T129": 45,
261
+ "I-T167": 105,
262
  "I-T168": 25,
263
+ "I-T170": 7,
264
+ "I-T184": 100,
265
+ "I-T190": 33,
266
+ "I-T191": 68,
267
+ "I-T201": 69,
268
+ "I-T204": 67,
269
+ "O": 73
270
  },
271
  "layer_norm_epsilon": 1e-05,
272
  "max_position_embeddings": 2048,
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0863e6d4b28b59b1f72ebd59ab57d0875600501f34c708ce51a0209372d6dcf8
3
  size 4993794184
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6556a1872666cc0d281e9049f5fe524a72689361e9758a42bff06f247cc031dd
3
  size 4993794184
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c1a0158cd87c5a5a252e3b9f5405755016e97a5e33df04072558b01478c76168
3
- size 269093076
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ad2d54d1e79dd330afca71cb34ec72427cc3d07f76f4b69b83a1c89adfef6a2
3
+ size 269429120
model.safetensors.index.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "metadata": {
3
- "total_size": 5262852364
4
  },
5
  "weight_map": {
6
  "classifier.bias": "model-00002-of-00002.safetensors",
 
1
  {
2
  "metadata": {
3
+ "total_size": 5263188400
4
  },
5
  "weight_map": {
6
  "classifier.bias": "model-00002-of-00002.safetensors",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:15e870b02362c8358020cdb3e08e732ac441d88177d547d09bed34305e8d228d
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aca836050c94f1c9e52e21c4a73b3318d10be3b79a3bc4c4ff8cd09eeeba963a
3
  size 5368