Ben10x committed on
Commit
ba84a90
·
verified ·
1 Parent(s): 7037635

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -47,226 +47,226 @@
47
  "gradient_checkpointing": false,
48
  "hidden_size": 2048,
49
  "id2label": {
50
- "0": "B-T023",
51
- "1": "I-T044",
52
- "2": "I-T074",
53
- "3": "I-T109",
54
- "4": "I-T114",
55
- "5": "B-T005",
56
- "6": "B-T058",
57
- "7": "B-T114",
58
- "8": "B-T097",
59
- "9": "I-T063",
60
- "10": "B-T062",
61
- "11": "I-T033",
62
- "12": "B-T082",
63
- "13": "B-T019",
64
- "14": "I-T097",
65
- "15": "I-T168",
66
- "16": "B-T081",
67
- "17": "I-T048",
68
- "18": "B-T040",
69
  "19": "B-T044",
70
- "20": "I-T125",
71
- "21": "B-T129",
72
- "22": "I-T167",
73
- "23": "B-T026",
74
- "24": "I-T121",
75
- "25": "B-T043",
76
- "26": "I-T059",
77
- "27": "B-T190",
78
- "28": "I-T007",
79
- "29": "B-T080",
80
- "30": "I-T028",
81
- "31": "I-T005",
82
- "32": "I-T092",
83
- "33": "B-T116",
84
- "34": "I-T037",
85
- "35": "I-T191",
86
- "36": "B-T025",
87
- "37": "B-T048",
88
- "38": "I-T031",
89
- "39": "B-T170",
90
- "40": "B-T098",
91
- "41": "I-T041",
92
- "42": "I-T204",
93
- "43": "B-T197",
94
- "44": "B-T046",
95
- "45": "I-T184",
96
- "46": "I-T026",
97
- "47": "B-T007",
98
- "48": "B-T045",
99
- "49": "I-T047",
100
  "50": "B-T104",
101
- "51": "I-T045",
102
- "52": "I-T103",
103
- "53": "I-T190",
104
- "54": "I-T201",
105
- "55": "I-T129",
106
- "56": "I-T082",
107
- "57": "B-T123",
108
- "58": "B-T024",
109
- "59": "I-T025",
110
- "60": "B-T059",
111
- "61": "B-T204",
112
- "62": "B-T041",
113
- "63": "B-T070",
114
- "64": "B-T131",
115
- "65": "B-T037",
116
- "66": "B-T121",
117
- "67": "B-T039",
118
- "68": "B-T169",
119
- "69": "B-T074",
120
- "70": "B-T191",
121
- "71": "B-T125",
122
- "72": "I-T116",
123
- "73": "I-T070",
124
- "74": "B-T047",
125
- "75": "B-T033",
126
- "76": "B-T038",
127
- "77": "I-T023",
128
- "78": "I-T038",
129
- "79": "I-T017",
130
- "80": "B-T092",
131
- "81": "O",
132
- "82": "B-T167",
133
- "83": "B-T063",
134
- "84": "B-T022",
135
- "85": "I-T019",
136
- "86": "I-T058",
137
- "87": "B-T103",
138
- "88": "B-T109",
139
- "89": "I-T043",
140
- "90": "I-T062",
141
- "91": "B-T020",
142
- "92": "B-T017",
143
- "93": "B-T028",
144
- "94": "I-T022",
145
- "95": "B-T091",
146
- "96": "I-T024",
147
- "97": "I-T046",
148
- "98": "I-T098",
149
- "99": "B-T184",
150
- "100": "I-T170",
151
- "101": "B-T031",
152
- "102": "B-T196",
153
- "103": "I-T039",
154
- "104": "I-T091",
155
- "105": "I-T020",
156
- "106": "B-T201",
157
- "107": "B-T168"
158
  },
159
  "initializer_range": 0.02,
160
  "intermediate_size": null,
161
  "label2id": {
162
- "B-T005": 5,
163
- "B-T007": 47,
164
- "B-T017": 92,
165
- "B-T019": 13,
166
- "B-T020": 91,
167
- "B-T022": 84,
168
- "B-T023": 0,
169
- "B-T024": 58,
170
- "B-T025": 36,
171
- "B-T026": 23,
172
- "B-T028": 93,
173
- "B-T031": 101,
174
- "B-T033": 75,
175
- "B-T037": 65,
176
- "B-T038": 76,
177
- "B-T039": 67,
178
- "B-T040": 18,
179
- "B-T041": 62,
180
- "B-T043": 25,
181
  "B-T044": 19,
182
- "B-T045": 48,
183
- "B-T046": 44,
184
- "B-T047": 74,
185
- "B-T048": 37,
186
- "B-T058": 6,
187
- "B-T059": 60,
188
- "B-T062": 10,
189
- "B-T063": 83,
190
- "B-T070": 63,
191
- "B-T074": 69,
192
- "B-T080": 29,
193
- "B-T081": 16,
194
- "B-T082": 12,
195
- "B-T091": 95,
196
- "B-T092": 80,
197
- "B-T097": 8,
198
- "B-T098": 40,
199
- "B-T103": 87,
200
  "B-T104": 50,
201
- "B-T109": 88,
202
- "B-T114": 7,
203
- "B-T116": 33,
204
- "B-T121": 66,
205
- "B-T123": 57,
206
- "B-T125": 71,
207
- "B-T129": 21,
208
- "B-T131": 64,
209
- "B-T167": 82,
210
- "B-T168": 107,
211
- "B-T169": 68,
212
- "B-T170": 39,
213
- "B-T184": 99,
214
- "B-T190": 27,
215
- "B-T191": 70,
216
- "B-T196": 102,
217
- "B-T197": 43,
218
- "B-T201": 106,
219
- "B-T204": 61,
220
- "I-T005": 31,
221
- "I-T007": 28,
222
- "I-T017": 79,
223
- "I-T019": 85,
224
- "I-T020": 105,
225
- "I-T022": 94,
226
- "I-T023": 77,
227
- "I-T024": 96,
228
- "I-T025": 59,
229
- "I-T026": 46,
230
- "I-T028": 30,
231
- "I-T031": 38,
232
- "I-T033": 11,
233
- "I-T037": 34,
234
- "I-T038": 78,
235
- "I-T039": 103,
236
- "I-T041": 41,
237
- "I-T043": 89,
238
- "I-T044": 1,
239
- "I-T045": 51,
240
- "I-T046": 97,
241
- "I-T047": 49,
242
- "I-T048": 17,
243
- "I-T058": 86,
244
- "I-T059": 26,
245
- "I-T062": 90,
246
- "I-T063": 9,
247
- "I-T070": 73,
248
- "I-T074": 2,
249
- "I-T082": 56,
250
- "I-T091": 104,
251
- "I-T092": 32,
252
- "I-T097": 14,
253
- "I-T098": 98,
254
- "I-T103": 52,
255
- "I-T109": 3,
256
- "I-T114": 4,
257
- "I-T116": 72,
258
- "I-T121": 24,
259
- "I-T125": 20,
260
- "I-T129": 55,
261
- "I-T167": 22,
262
- "I-T168": 15,
263
- "I-T170": 100,
264
- "I-T184": 45,
265
- "I-T190": 53,
266
- "I-T191": 35,
267
- "I-T201": 54,
268
- "I-T204": 42,
269
- "O": 81
270
  },
271
  "layer_norm_epsilon": 1e-05,
272
  "max_position_embeddings": 2048,
 
47
  "gradient_checkpointing": false,
48
  "hidden_size": 2048,
49
  "id2label": {
50
+ "0": "I-T191",
51
+ "1": "I-T038",
52
+ "2": "I-T048",
53
+ "3": "B-T062",
54
+ "4": "O",
55
+ "5": "I-T031",
56
+ "6": "I-T025",
57
+ "7": "I-T043",
58
+ "8": "B-T031",
59
+ "9": "B-T005",
60
+ "10": "B-T023",
61
+ "11": "B-T033",
62
+ "12": "I-T026",
63
+ "13": "B-T116",
64
+ "14": "I-T020",
65
+ "15": "B-T201",
66
+ "16": "I-T024",
67
+ "17": "B-T039",
68
+ "18": "B-T037",
69
  "19": "B-T044",
70
+ "20": "I-T170",
71
+ "21": "I-T063",
72
+ "22": "I-T204",
73
+ "23": "B-T017",
74
+ "24": "I-T167",
75
+ "25": "B-T045",
76
+ "26": "B-T131",
77
+ "27": "I-T201",
78
+ "28": "I-T103",
79
+ "29": "B-T170",
80
+ "30": "B-T168",
81
+ "31": "B-T046",
82
+ "32": "I-T037",
83
+ "33": "B-T190",
84
+ "34": "I-T184",
85
+ "35": "I-T059",
86
+ "36": "B-T058",
87
+ "37": "B-T167",
88
+ "38": "B-T103",
89
+ "39": "B-T074",
90
+ "40": "B-T024",
91
+ "41": "I-T017",
92
+ "42": "I-T097",
93
+ "43": "I-T070",
94
+ "44": "B-T196",
95
+ "45": "B-T114",
96
+ "46": "B-T121",
97
+ "47": "B-T204",
98
+ "48": "B-T040",
99
+ "49": "B-T091",
100
  "50": "B-T104",
101
+ "51": "I-T007",
102
+ "52": "B-T070",
103
+ "53": "I-T023",
104
+ "54": "I-T045",
105
+ "55": "B-T063",
106
+ "56": "I-T058",
107
+ "57": "B-T169",
108
+ "58": "B-T025",
109
+ "59": "I-T044",
110
+ "60": "I-T033",
111
+ "61": "I-T091",
112
+ "62": "B-T028",
113
+ "63": "I-T168",
114
+ "64": "B-T184",
115
+ "65": "B-T123",
116
+ "66": "B-T026",
117
+ "67": "B-T092",
118
+ "68": "B-T191",
119
+ "69": "I-T047",
120
+ "70": "I-T114",
121
+ "71": "I-T022",
122
+ "72": "I-T125",
123
+ "73": "I-T116",
124
+ "74": "B-T007",
125
+ "75": "B-T022",
126
+ "76": "B-T080",
127
+ "77": "B-T019",
128
+ "78": "I-T039",
129
+ "79": "B-T098",
130
+ "80": "B-T109",
131
+ "81": "B-T125",
132
+ "82": "B-T048",
133
+ "83": "B-T059",
134
+ "84": "I-T190",
135
+ "85": "I-T092",
136
+ "86": "B-T038",
137
+ "87": "I-T019",
138
+ "88": "B-T097",
139
+ "89": "I-T109",
140
+ "90": "I-T046",
141
+ "91": "I-T082",
142
+ "92": "I-T062",
143
+ "93": "I-T129",
144
+ "94": "B-T082",
145
+ "95": "I-T005",
146
+ "96": "I-T028",
147
+ "97": "I-T041",
148
+ "98": "B-T041",
149
+ "99": "B-T047",
150
+ "100": "B-T197",
151
+ "101": "I-T121",
152
+ "102": "B-T020",
153
+ "103": "I-T074",
154
+ "104": "B-T043",
155
+ "105": "I-T098",
156
+ "106": "B-T081",
157
+ "107": "B-T129"
158
  },
159
  "initializer_range": 0.02,
160
  "intermediate_size": null,
161
  "label2id": {
162
+ "B-T005": 9,
163
+ "B-T007": 74,
164
+ "B-T017": 23,
165
+ "B-T019": 77,
166
+ "B-T020": 102,
167
+ "B-T022": 75,
168
+ "B-T023": 10,
169
+ "B-T024": 40,
170
+ "B-T025": 58,
171
+ "B-T026": 66,
172
+ "B-T028": 62,
173
+ "B-T031": 8,
174
+ "B-T033": 11,
175
+ "B-T037": 18,
176
+ "B-T038": 86,
177
+ "B-T039": 17,
178
+ "B-T040": 48,
179
+ "B-T041": 98,
180
+ "B-T043": 104,
181
  "B-T044": 19,
182
+ "B-T045": 25,
183
+ "B-T046": 31,
184
+ "B-T047": 99,
185
+ "B-T048": 82,
186
+ "B-T058": 36,
187
+ "B-T059": 83,
188
+ "B-T062": 3,
189
+ "B-T063": 55,
190
+ "B-T070": 52,
191
+ "B-T074": 39,
192
+ "B-T080": 76,
193
+ "B-T081": 106,
194
+ "B-T082": 94,
195
+ "B-T091": 49,
196
+ "B-T092": 67,
197
+ "B-T097": 88,
198
+ "B-T098": 79,
199
+ "B-T103": 38,
200
  "B-T104": 50,
201
+ "B-T109": 80,
202
+ "B-T114": 45,
203
+ "B-T116": 13,
204
+ "B-T121": 46,
205
+ "B-T123": 65,
206
+ "B-T125": 81,
207
+ "B-T129": 107,
208
+ "B-T131": 26,
209
+ "B-T167": 37,
210
+ "B-T168": 30,
211
+ "B-T169": 57,
212
+ "B-T170": 29,
213
+ "B-T184": 64,
214
+ "B-T190": 33,
215
+ "B-T191": 68,
216
+ "B-T196": 44,
217
+ "B-T197": 100,
218
+ "B-T201": 15,
219
+ "B-T204": 47,
220
+ "I-T005": 95,
221
+ "I-T007": 51,
222
+ "I-T017": 41,
223
+ "I-T019": 87,
224
+ "I-T020": 14,
225
+ "I-T022": 71,
226
+ "I-T023": 53,
227
+ "I-T024": 16,
228
+ "I-T025": 6,
229
+ "I-T026": 12,
230
+ "I-T028": 96,
231
+ "I-T031": 5,
232
+ "I-T033": 60,
233
+ "I-T037": 32,
234
+ "I-T038": 1,
235
+ "I-T039": 78,
236
+ "I-T041": 97,
237
+ "I-T043": 7,
238
+ "I-T044": 59,
239
+ "I-T045": 54,
240
+ "I-T046": 90,
241
+ "I-T047": 69,
242
+ "I-T048": 2,
243
+ "I-T058": 56,
244
+ "I-T059": 35,
245
+ "I-T062": 92,
246
+ "I-T063": 21,
247
+ "I-T070": 43,
248
+ "I-T074": 103,
249
+ "I-T082": 91,
250
+ "I-T091": 61,
251
+ "I-T092": 85,
252
+ "I-T097": 42,
253
+ "I-T098": 105,
254
+ "I-T103": 28,
255
+ "I-T109": 89,
256
+ "I-T114": 70,
257
+ "I-T116": 73,
258
+ "I-T121": 101,
259
+ "I-T125": 72,
260
+ "I-T129": 93,
261
+ "I-T167": 24,
262
+ "I-T168": 63,
263
+ "I-T170": 20,
264
+ "I-T184": 34,
265
+ "I-T190": 84,
266
+ "I-T191": 0,
267
+ "I-T201": 27,
268
+ "I-T204": 22,
269
+ "O": 4
270
  },
271
  "layer_norm_epsilon": 1e-05,
272
  "max_position_embeddings": 2048,
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30717d510e73efac7ea091447f27cb3041934da161fdc8b8a2b5aeb507ea007d
3
  size 4993794184
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad5e509452472b359780e71cff9213aaa2cdc878b1713739a4575a47d1a99efe
3
  size 4993794184
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b83ae006bf803333da263092a79cf7c0e3d10a895ee55087bbe49ceb45d3a41
3
  size 269429120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6885b9686901810b05407953c1528ab92c3975a9fed67981d3a3463b23ee8bd3
3
  size 269429120
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aca836050c94f1c9e52e21c4a73b3318d10be3b79a3bc4c4ff8cd09eeeba963a
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a027e0259c28b5559a4e924b64dbbc3a127b433c503ae13f97c8163d603fa8d
3
  size 5368