YWZBrandon commited on
Commit
67a170a
·
verified ·
1 Parent(s): 1f88cae

End of training

Browse files
20250513_010808.log ADDED
@@ -0,0 +1,86 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0
  0%| | 0/782 [00:00<?, ?it/s]/root/miniconda3/envs/wikidyk/lib/python3.10/site-packages/transformers/tokenization_utils_base.py:3980: UserWarning: `as_target_tokenizer` is deprecated and will be removed in v5 of Transformers. You can tokenize your labels by using the argument `text_target` of the regular `__call__` method (either in the same call as your input texts if you use the same keyword arguments, or in a separate call.
 
 
 
 
1
  0%| | 1/782 [00:00<11:29, 1.13it/s]
2
  0%| | 2/782 [00:02<15:37, 1.20s/it]
3
  0%| | 3/782 [00:02<11:24, 1.14it/s]
4
  1%| | 4/782 [00:03<09:45, 1.33it/s]
5
  1%| | 5/782 [00:03<08:53, 1.46it/s]
6
  1%| | 6/782 [00:04<07:57, 1.62it/s]
7
  1%| | 7/782 [00:05<10:15, 1.26it/s]
8
  1%| | 8/782 [00:06<09:03, 1.42it/s]
9
  1%| | 9/782 [00:06<08:31, 1.51it/s]
10
  1%|▏ | 10/782 [00:07<08:10, 1.57it/s]
11
  1%|▏ | 11/782 [00:07<07:35, 1.69it/s]
12
  2%|▏ | 12/782 [00:08<07:17, 1.76it/s]
13
  2%|▏ | 13/782 [00:08<07:22, 1.74it/s]
14
  2%|▏ | 14/782 [00:09<07:07, 1.80it/s]
15
  2%|▏ | 15/782 [00:09<06:59, 1.83it/s]
16
  2%|▏ | 16/782 [00:10<06:50, 1.87it/s]
17
  2%|▏ | 17/782 [00:10<06:54, 1.85it/s]
18
  2%|▏ | 18/782 [00:11<06:49, 1.87it/s]
19
  2%|▏ | 19/782 [00:11<06:42, 1.90it/s]
20
  3%|▎ | 20/782 [00:12<06:51, 1.85it/s]
21
  3%|▎ | 21/782 [00:13<06:52, 1.85it/s]
22
  3%|▎ | 22/782 [00:13<06:37, 1.91it/s]
23
  3%|▎ | 23/782 [00:14<06:56, 1.82it/s]
24
  3%|▎ | 24/782 [00:14<06:59, 1.81it/s]
25
  3%|▎ | 25/782 [00:15<06:37, 1.90it/s]
26
  3%|▎ | 26/782 [00:15<06:40, 1.89it/s]
27
  3%|▎ | 27/782 [00:16<06:50, 1.84it/s]
28
  4%|▎ | 28/782 [00:16<06:48, 1.85it/s]
29
  4%|▎ | 29/782 [00:17<06:40, 1.88it/s]
30
  4%|▍ | 30/782 [00:17<06:41, 1.87it/s]
31
  4%|▍ | 31/782 [00:18<06:38, 1.89it/s]
32
  4%|▍ | 32/782 [00:18<06:35, 1.89it/s]
33
  4%|▍ | 33/782 [00:19<06:40, 1.87it/s]
34
  4%|▍ | 34/782 [00:19<06:34, 1.89it/s]
35
  4%|▍ | 35/782 [00:20<06:34, 1.90it/s]
36
  5%|▍ | 36/782 [00:21<06:40, 1.86it/s]
37
  5%|▍ | 37/782 [00:21<06:29, 1.91it/s]
38
  5%|▍ | 38/782 [00:22<08:52, 1.40it/s]
39
  5%|▍ | 39/782 [00:23<08:07, 1.52it/s]
40
  5%|▌ | 40/782 [00:23<07:41, 1.61it/s]
41
  5%|▌ | 41/782 [00:24<07:14, 1.71it/s]
42
  5%|▌ | 42/782 [00:24<06:50, 1.80it/s]
43
  5%|▌ | 43/782 [00:25<06:53, 1.79it/s]
44
  6%|▌ | 44/782 [00:25<07:05, 1.74it/s]
45
  6%|▌ | 45/782 [00:26<06:50, 1.80it/s]
46
  6%|▌ | 46/782 [00:27<06:47, 1.81it/s]
47
  6%|▌ | 47/782 [00:27<06:47, 1.80it/s]
48
  6%|▌ | 48/782 [00:28<06:53, 1.78it/s]
49
  6%|▋ | 49/782 [00:28<06:33, 1.86it/s]
50
  6%|▋ | 50/782 [00:29<06:33, 1.86it/s]
51
 
 
52
  6%|▋ | 50/782 [00:29<06:33, 1.86it/s]
53
  7%|▋ | 51/782 [00:29<06:53, 1.77it/s]
54
  7%|▋ | 52/782 [00:30<06:49, 1.78it/s]
55
  7%|▋ | 53/782 [00:30<06:34, 1.85it/s]
56
  7%|▋ | 54/782 [00:31<06:31, 1.86it/s]
57
  7%|▋ | 55/782 [00:32<06:50, 1.77it/s]
58
  7%|▋ | 56/782 [00:32<06:42, 1.80it/s]
59
  7%|▋ | 57/782 [00:33<06:32, 1.85it/s]
60
  7%|▋ | 58/782 [00:33<06:25, 1.88it/s]
61
  8%|▊ | 59/782 [00:34<06:32, 1.84it/s]
62
  8%|▊ | 60/782 [00:34<06:28, 1.86it/s]
63
  8%|▊ | 61/782 [00:35<06:18, 1.90it/s]
64
  8%|▊ | 62/782 [00:36<08:41, 1.38it/s]
65
  8%|▊ | 63/782 [00:36<08:00, 1.50it/s]
66
  8%|▊ | 64/782 [00:37<07:31, 1.59it/s]
67
  8%|▊ | 65/782 [00:37<06:59, 1.71it/s]
68
  8%|▊ | 66/782 [00:38<06:56, 1.72it/s]
69
  9%|▊ | 67/782 [00:39<06:52, 1.73it/s]
70
  9%|▊ | 68/782 [00:39<06:35, 1.81it/s]
71
  9%|▉ | 69/782 [00:40<06:38, 1.79it/s]
72
  9%|▉ | 70/782 [00:40<06:58, 1.70it/s]
73
  9%|▉ | 71/782 [00:41<06:36, 1.79it/s]
74
  9%|▉ | 72/782 [00:41<06:26, 1.84it/s]
75
  9%|▉ | 73/782 [00:42<06:22, 1.85it/s]
76
  9%|▉ | 74/782 [00:42<06:24, 1.84it/s]
77
  10%|▉ | 75/782 [00:43<06:24, 1.84it/s]
78
  10%|▉ | 76/782 [00:43<06:30, 1.81it/s]
79
  10%|▉ | 77/782 [00:44<06:43, 1.75it/s]
80
  10%|▉ | 78/782 [00:45<06:40, 1.76it/s]
81
  10%|█ | 79/782 [00:45<06:28, 1.81it/s]
82
  10%|█ | 80/782 [00:46<06:27, 1.81it/s]
83
  10%|█ | 81/782 [00:46<06:33, 1.78it/s]
84
  10%|█ | 82/782 [00:47<06:17, 1.85it/s]
85
  11%|█ | 83/782 [00:47<06:09, 1.89it/s]
86
  11%|█ | 84/782 [00:48<06:09, 1.89it/s]
87
  11%|█ | 85/782 [00:48<06:16, 1.85it/s]
88
  11%|█ | 86/782 [00:49<06:16, 1.85it/s]
89
  11%|█ | 87/782 [00:49<06:07, 1.89it/s]
90
  11%|█▏ | 88/782 [00:50<06:10, 1.87it/s]
91
  11%|█▏ | 89/782 [00:50<06:07, 1.89it/s]
92
  12%|█▏ | 90/782 [00:51<06:02, 1.91it/s]
93
  12%|█▏ | 91/782 [00:52<06:33, 1.76it/s]
94
  12%|█▏ | 92/782 [00:53<09:21, 1.23it/s]
95
  12%|█▏ | 93/782 [00:54<08:28, 1.35it/s]
96
  12%|█▏ | 94/782 [00:54<07:33, 1.52it/s]
97
  12%|█▏ | 95/782 [00:55<07:15, 1.58it/s]
98
  12%|█▏ | 96/782 [00:55<07:19, 1.56it/s]
99
  12%|█▏ | 97/782 [00:56<06:48, 1.68it/s]
100
  13%|█▎ | 98/782 [00:56<06:40, 1.71it/s]
101
  13%|█▎ | 99/782 [00:57<06:28, 1.76it/s]
102
  13%|█▎ | 100/782 [00:57<06:23, 1.78it/s]
103
 
 
104
  13%|█▎ | 100/782 [00:58<06:23, 1.78it/s]
105
  13%|█▎ | 101/782 [00:58<06:15, 1.81it/s]
106
  13%|█▎ | 102/782 [00:59<06:08, 1.84it/s]
107
  13%|█▎ | 103/782 [00:59<06:12, 1.82it/s]
108
  13%|█▎ | 104/782 [01:00<06:14, 1.81it/s]
109
  13%|█▎ | 105/782 [01:00<06:01, 1.87it/s]
110
  14%|█▎ | 106/782 [01:01<05:58, 1.88it/s]
111
  14%|█▎ | 107/782 [01:01<06:06, 1.84it/s]
112
  14%|█▍ | 108/782 [01:02<05:53, 1.91it/s]
113
  14%|█▍ | 109/782 [01:02<05:59, 1.87it/s]
114
  14%|█▍ | 110/782 [01:03<06:05, 1.84it/s]
115
  14%|█▍ | 111/782 [01:03<05:54, 1.89it/s]
116
  14%|█▍ | 112/782 [01:04<05:57, 1.87it/s]
117
  14%|█▍ | 113/782 [01:04<06:02, 1.85it/s]
118
  15%|█▍ | 114/782 [01:05<05:52, 1.89it/s]
119
  15%|█▍ | 115/782 [01:05<05:59, 1.85it/s]
120
  15%|█▍ | 116/782 [01:06<06:02, 1.84it/s]
121
  15%|█▍ | 117/782 [01:07<05:49, 1.90it/s]
122
  15%|█▌ | 118/782 [01:07<05:57, 1.86it/s]
123
  15%|█▌ | 119/782 [01:08<06:02, 1.83it/s]
124
  15%|█▌ | 120/782 [01:08<05:54, 1.87it/s]
125
  15%|█▌ | 121/782 [01:09<05:52, 1.88it/s]
126
  16%|█▌ | 122/782 [01:09<06:00, 1.83it/s]
127
  16%|█▌ | 123/782 [01:10<05:54, 1.86it/s]
128
  16%|█▌ | 124/782 [01:10<05:49, 1.89it/s]
129
  16%|█▌ | 125/782 [01:11<05:45, 1.90it/s]
130
  16%|█▌ | 126/782 [01:11<05:49, 1.88it/s]
131
  16%|█▌ | 127/782 [01:12<05:41, 1.92it/s]
132
  16%|█▋ | 128/782 [01:12<05:33, 1.96it/s]
133
  16%|█▋ | 129/782 [01:13<05:43, 1.90it/s]
134
  17%|█▋ | 130/782 [01:13<05:48, 1.87it/s]
135
  17%|█▋ | 131/782 [01:14<05:36, 1.94it/s]
136
  17%|█▋ | 132/782 [01:14<05:44, 1.89it/s]
137
  17%|█▋ | 133/782 [01:15<05:58, 1.81it/s]
138
  17%|█▋ | 134/782 [01:16<05:47, 1.87it/s]
139
  17%|█▋ | 135/782 [01:16<05:53, 1.83it/s]
140
  17%|█▋ | 136/782 [01:17<06:16, 1.72it/s]
141
  18%|█▊ | 137/782 [01:17<05:56, 1.81it/s]
142
  18%|█▊ | 138/782 [01:18<05:55, 1.81it/s]
143
  18%|█▊ | 139/782 [01:18<06:02, 1.77it/s]
144
  18%|█▊ | 140/782 [01:19<05:45, 1.86it/s]
145
  18%|█▊ | 141/782 [01:19<05:41, 1.88it/s]
146
  18%|█▊ | 142/782 [01:20<05:41, 1.88it/s]
147
  18%|█▊ | 143/782 [01:20<05:35, 1.91it/s]
148
  18%|█▊ | 144/782 [01:21<05:34, 1.91it/s]
149
  19%|█▊ | 145/782 [01:22<05:32, 1.92it/s]
150
  19%|█▊ | 146/782 [01:22<05:53, 1.80it/s]
151
  19%|█▉ | 147/782 [01:23<05:42, 1.86it/s]
152
  19%|█▉ | 148/782 [01:23<05:40, 1.86it/s]
153
  19%|█▉ | 149/782 [01:24<05:44, 1.84it/s]
154
  19%|█▉ | 150/782 [01:24<05:44, 1.84it/s]
155
 
 
156
  19%|█▉ | 150/782 [01:24<05:44, 1.84it/s]
157
  19%|█▉ | 151/782 [01:25<05:36, 1.87it/s]
158
  19%|█▉ | 152/782 [01:25<05:39, 1.86it/s]
159
  20%|█▉ | 153/782 [01:26<05:49, 1.80it/s]
160
  20%|█▉ | 154/782 [01:26<05:34, 1.88it/s]
161
  20%|█▉ | 155/782 [01:27<05:42, 1.83it/s]
162
  20%|█▉ | 156/782 [01:28<05:57, 1.75it/s]
163
  20%|██ | 157/782 [01:28<05:43, 1.82it/s]
164
  20%|██ | 158/782 [01:29<05:38, 1.85it/s]
165
  20%|██ | 159/782 [01:29<05:47, 1.79it/s]
166
  20%|██ | 160/782 [01:30<05:37, 1.84it/s]
167
  21%|██ | 161/782 [01:30<05:37, 1.84it/s]
168
  21%|██ | 162/782 [01:31<05:53, 1.75it/s]
169
  21%|██ | 163/782 [01:31<05:43, 1.80it/s]
170
  21%|██ | 164/782 [01:32<05:34, 1.85it/s]
171
  21%|██ | 165/782 [01:32<05:27, 1.88it/s]
172
  21%|██ | 166/782 [01:33<05:31, 1.86it/s]
173
  21%|██▏ | 167/782 [01:34<05:51, 1.75it/s]
174
  21%|██▏ | 168/782 [01:34<05:29, 1.86it/s]
175
  22%|██▏ | 169/782 [01:35<05:31, 1.85it/s]
176
  22%|██▏ | 170/782 [01:35<05:39, 1.80it/s]
177
  22%|██▏ | 171/782 [01:36<05:23, 1.89it/s]
178
  22%|██▏ | 172/782 [01:36<05:27, 1.86it/s]
179
  22%|██▏ | 173/782 [01:37<05:29, 1.85it/s]
180
  22%|██▏ | 174/782 [01:37<05:31, 1.84it/s]
181
  22%|██▏ | 175/782 [01:38<05:23, 1.88it/s]
182
  23%|██▎ | 176/782 [01:38<05:26, 1.86it/s]
183
  23%|██▎ | 177/782 [01:39<05:23, 1.87it/s]
184
  23%|██▎ | 178/782 [01:40<05:23, 1.86it/s]
185
  23%|██▎ | 179/782 [01:40<05:17, 1.90it/s]
186
  23%|██▎ | 180/782 [01:41<05:24, 1.86it/s]
187
  23%|██▎ | 181/782 [01:41<05:21, 1.87it/s]
188
  23%|██▎ | 182/782 [01:42<05:21, 1.87it/s]
189
  23%|██▎ | 183/782 [01:42<05:22, 1.86it/s]
190
  24%|██▎ | 184/782 [01:43<05:19, 1.87it/s]
191
  24%|██▎ | 185/782 [01:43<05:20, 1.86it/s]
192
  24%|██▍ | 186/782 [01:44<05:28, 1.82it/s]
193
  24%|██▍ | 187/782 [01:44<05:18, 1.87it/s]
194
  24%|██▍ | 188/782 [01:45<05:15, 1.89it/s]
195
  24%|██▍ | 189/782 [01:45<05:16, 1.87it/s]
196
  24%|██▍ | 190/782 [01:46<05:16, 1.87it/s]
197
  24%|██▍ | 191/782 [01:46<05:12, 1.89it/s]
198
  25%|██▍ | 192/782 [01:47<05:29, 1.79it/s]
199
  25%|██▍ | 193/782 [01:48<05:26, 1.81it/s]
200
  25%|██▍ | 194/782 [01:48<05:18, 1.84it/s]
201
  25%|██▍ | 195/782 [01:49<05:22, 1.82it/s]
202
  25%|██▌ | 196/782 [01:49<05:20, 1.83it/s]
203
  25%|██▌ | 197/782 [01:50<05:10, 1.88it/s]
204
  25%|██▌ | 198/782 [01:50<05:15, 1.85it/s]
205
  25%|██▌ | 199/782 [01:51<05:31, 1.76it/s]
206
  26%|██▌ | 200/782 [01:51<05:20, 1.81it/s]
207
 
 
208
  26%|██▌ | 200/782 [01:52<05:20, 1.81it/s]
209
  26%|██▌ | 201/782 [01:52<05:17, 1.83it/s]
210
  26%|██▌ | 202/782 [01:53<05:25, 1.78it/s]
211
  26%|██▌ | 203/782 [01:53<05:12, 1.85it/s]
212
  26%|██▌ | 204/782 [01:54<05:13, 1.84it/s]
213
  26%|██▌ | 205/782 [01:54<05:23, 1.79it/s]
214
  26%|██▋ | 206/782 [01:55<05:07, 1.87it/s]
215
  26%|██▋ | 207/782 [01:55<05:09, 1.86it/s]
216
  27%|██▋ | 208/782 [01:56<05:20, 1.79it/s]
217
  27%|██▋ | 209/782 [01:56<05:12, 1.83it/s]
218
  27%|██▋ | 210/782 [01:57<05:05, 1.87it/s]
219
  27%|██▋ | 211/782 [01:57<05:03, 1.88it/s]
220
  27%|██▋ | 212/782 [01:58<05:05, 1.86it/s]
221
  27%|██▋ | 213/782 [01:59<05:15, 1.80it/s]
222
  27%|██▋ | 214/782 [01:59<05:02, 1.88it/s]
223
  27%|██▋ | 215/782 [02:00<05:07, 1.85it/s]
224
  28%|██▊ | 216/782 [02:00<05:14, 1.80it/s]
225
  28%|██▊ | 217/782 [02:01<05:02, 1.87it/s]
226
  28%|██▊ | 218/782 [02:01<05:03, 1.86it/s]
227
  28%|██▊ | 219/782 [02:02<05:09, 1.82it/s]
228
  28%|██▊ | 220/782 [02:02<04:59, 1.88it/s]
229
  28%|██▊ | 221/782 [02:03<04:57, 1.89it/s]
230
  28%|██▊ | 222/782 [02:03<04:51, 1.92it/s]
231
  29%|██▊ | 223/782 [02:04<04:56, 1.89it/s]
232
  29%|██▊ | 224/782 [02:04<04:56, 1.88it/s]
233
  29%|██▉ | 225/782 [02:05<04:48, 1.93it/s]
234
  29%|██▉ | 226/782 [02:05<04:55, 1.88it/s]
235
  29%|██▉ | 227/782 [02:06<05:02, 1.83it/s]
236
  29%|██▉ | 228/782 [02:07<04:53, 1.89it/s]
237
  29%|██▉ | 229/782 [02:07<04:54, 1.87it/s]
238
  29%|██▉ | 230/782 [02:08<05:09, 1.78it/s]
239
  30%|██▉ | 231/782 [02:08<04:57, 1.85it/s]
240
  30%|██▉ | 232/782 [02:09<04:58, 1.84it/s]
241
  30%|██▉ | 233/782 [02:09<05:01, 1.82it/s]
242
  30%|██▉ | 234/782 [02:10<04:59, 1.83it/s]
243
  30%|███ | 235/782 [02:10<04:55, 1.85it/s]
244
  30%|███ | 236/782 [02:11<04:54, 1.85it/s]
245
  30%|███ | 237/782 [02:11<04:55, 1.84it/s]
246
  30%|███ | 238/782 [02:12<04:45, 1.90it/s]
247
  31%|███ | 239/782 [02:12<04:47, 1.89it/s]
248
  31%|███ | 240/782 [02:13<04:52, 1.86it/s]
249
  31%|███ | 241/782 [02:14<04:54, 1.84it/s]
250
  31%|███ | 242/782 [02:14<04:39, 1.93it/s]
251
  31%|███ | 243/782 [02:15<04:43, 1.90it/s]
252
  31%|███ | 244/782 [02:15<05:08, 1.74it/s]
253
  31%|███▏ | 245/782 [02:16<04:53, 1.83it/s]
254
  31%|███▏ | 246/782 [02:16<04:51, 1.84it/s]
255
  32%|███▏ | 247/782 [02:17<04:48, 1.86it/s]
256
  32%|███▏ | 248/782 [02:17<04:54, 1.81it/s]
257
  32%|███▏ | 249/782 [02:18<04:53, 1.82it/s]
258
  32%|███▏ | 250/782 [02:18<04:40, 1.90it/s]
259
 
 
260
  32%|███▏ | 250/782 [02:19<04:40, 1.90it/s]
261
  32%|███▏ | 251/782 [02:19<04:45, 1.86it/s]
262
  32%|███▏ | 252/782 [02:20<04:51, 1.82it/s]
263
  32%|███▏ | 253/782 [02:20<04:42, 1.87it/s]
264
  32%|███▏ | 254/782 [02:21<04:40, 1.88it/s]
265
  33%|███▎ | 255/782 [02:21<04:39, 1.89it/s]
266
  33%|███▎ | 256/782 [02:22<04:37, 1.90it/s]
267
  33%|███▎ | 257/782 [02:22<04:34, 1.91it/s]
268
  33%|███▎ | 258/782 [02:23<04:36, 1.89it/s]
269
  33%|███▎ | 259/782 [02:23<04:45, 1.83it/s]
270
  33%|███▎ | 260/782 [02:24<04:37, 1.88it/s]
271
  33%|███▎ | 261/782 [02:24<04:31, 1.92it/s]
272
  34%|███▎ | 262/782 [02:25<04:36, 1.88it/s]
273
  34%|███▎ | 263/782 [02:25<04:38, 1.86it/s]
274
  34%|███▍ | 264/782 [02:26<04:37, 1.87it/s]
275
  34%|███▍ | 265/782 [02:26<04:40, 1.84it/s]
276
  34%|███▍ | 266/782 [02:27<04:33, 1.89it/s]
277
  34%|███▍ | 267/782 [02:28<04:37, 1.86it/s]
278
  34%|███▍ | 268/782 [02:28<04:43, 1.81it/s]
279
  34%|███▍ | 269/782 [02:29<04:47, 1.78it/s]
280
  35%|███▍ | 270/782 [02:29<04:36, 1.85it/s]
281
  35%|███▍ | 271/782 [02:30<04:40, 1.82it/s]
282
  35%|███▍ | 272/782 [02:30<04:49, 1.76it/s]
283
  35%|███▍ | 273/782 [02:31<04:37, 1.84it/s]
284
  35%|███▌ | 274/782 [02:31<04:35, 1.84it/s]
285
  35%|███▌ | 275/782 [02:32<04:41, 1.80it/s]
286
  35%|███▌ | 276/782 [02:32<04:30, 1.87it/s]
287
  35%|███▌ | 277/782 [02:33<04:35, 1.83it/s]
288
  36%|███▌ | 278/782 [02:34<04:34, 1.84it/s]
289
  36%|███▌ | 279/782 [02:34<04:33, 1.84it/s]
290
  36%|███▌ | 280/782 [02:35<04:33, 1.84it/s]
291
  36%|███▌ | 281/782 [02:35<04:36, 1.81it/s]
292
  36%|███▌ | 282/782 [02:36<04:26, 1.88it/s]
293
  36%|███▌ | 283/782 [02:36<04:29, 1.85it/s]
294
  36%|███▋ | 284/782 [02:37<04:38, 1.79it/s]
295
  36%|███▋ | 285/782 [02:37<04:29, 1.85it/s]
296
  37%|███▋ | 286/782 [02:38<04:30, 1.83it/s]
297
  37%|███▋ | 287/782 [02:38<04:28, 1.85it/s]
298
  37%|███▋ | 288/782 [02:39<04:22, 1.88it/s]
299
  37%|███▋ | 289/782 [02:40<04:24, 1.87it/s]
300
  37%|███▋ | 290/782 [02:40<04:41, 1.75it/s]
301
  37%|███▋ | 291/782 [02:41<04:33, 1.80it/s]
302
  37%|███▋ | 292/782 [02:41<04:29, 1.82it/s]
303
  37%|███▋ | 293/782 [02:42<04:37, 1.76it/s]
304
  38%|███▊ | 294/782 [02:42<04:24, 1.85it/s]
305
  38%|███▊ | 295/782 [02:43<04:26, 1.83it/s]
306
  38%|███▊ | 296/782 [02:43<04:32, 1.78it/s]
307
  38%|███▊ | 297/782 [02:44<04:26, 1.82it/s]
308
  38%|███▊ | 298/782 [02:44<04:17, 1.88it/s]
309
  38%|███▊ | 299/782 [02:45<04:18, 1.87it/s]
310
  38%|███▊ | 300/782 [02:46<04:16, 1.88it/s]
311
 
 
312
  38%|███▊ | 300/782 [02:46<04:16, 1.88it/s]
313
  38%|███▊ | 301/782 [02:46<04:18, 1.86it/s]
314
  39%|███▊ | 302/782 [02:47<04:18, 1.86it/s]
315
  39%|███▊ | 303/782 [02:47<04:20, 1.84it/s]
316
  39%|███▉ | 304/782 [02:48<04:19, 1.84it/s]
317
  39%|███▉ | 305/782 [02:48<04:13, 1.88it/s]
318
  39%|██���▉ | 306/782 [02:49<04:16, 1.86it/s]
319
  39%|███▉ | 307/782 [02:49<04:10, 1.89it/s]
320
  39%|███▉ | 308/782 [02:50<04:10, 1.89it/s]
321
  40%|███▉ | 309/782 [02:50<04:11, 1.88it/s]
322
  40%|███▉ | 310/782 [02:51<04:09, 1.89it/s]
323
  40%|███▉ | 311/782 [02:51<04:07, 1.90it/s]
324
  40%|███▉ | 312/782 [02:52<04:08, 1.89it/s]
325
  40%|████ | 313/782 [02:52<04:09, 1.88it/s]
326
  40%|████ | 314/782 [02:53<04:08, 1.88it/s]
327
  40%|████ | 315/782 [02:54<04:15, 1.83it/s]
328
  40%|████ | 316/782 [02:54<04:13, 1.84it/s]
329
  41%|████ | 317/782 [02:55<04:07, 1.88it/s]
330
  41%|████ | 318/782 [02:55<04:06, 1.88it/s]
331
  41%|████ | 319/782 [02:56<04:03, 1.90it/s]
332
  41%|████ | 320/782 [02:56<04:00, 1.92it/s]
333
  41%|████ | 321/782 [02:57<04:05, 1.87it/s]
334
  41%|████ | 322/782 [02:57<04:09, 1.84it/s]
335
  41%|████▏ | 323/782 [02:58<04:05, 1.87it/s]
336
  41%|████▏ | 324/782 [02:58<04:04, 1.88it/s]
337
  42%|████▏ | 325/782 [02:59<04:05, 1.86it/s]
338
  42%|████▏ | 326/782 [02:59<04:01, 1.89it/s]
339
  42%|████▏ | 327/782 [03:00<03:59, 1.90it/s]
340
  42%|████▏ | 328/782 [03:01<04:06, 1.84it/s]
341
  42%|████▏ | 329/782 [03:01<04:02, 1.86it/s]
342
  42%|████▏ | 330/782 [03:02<04:00, 1.88it/s]
343
  42%|████▏ | 331/782 [03:02<03:59, 1.88it/s]
344
  42%|████▏ | 332/782 [03:03<04:12, 1.78it/s]
345
  43%|████▎ | 333/782 [03:03<04:09, 1.80it/s]
346
  43%|████▎ | 334/782 [03:04<04:01, 1.86it/s]
347
  43%|████▎ | 335/782 [03:04<04:05, 1.82it/s]
348
  43%|████▎ | 336/782 [03:05<04:19, 1.72it/s]
349
  43%|████▎ | 337/782 [03:05<04:03, 1.83it/s]
350
  43%|████▎ | 338/782 [03:06<04:02, 1.83it/s]
351
  43%|████▎ | 339/782 [03:07<03:59, 1.85it/s]
352
  43%|████▎ | 340/782 [03:07<03:50, 1.91it/s]
353
  44%|████▎ | 341/782 [03:08<03:51, 1.90it/s]
354
  44%|████▎ | 342/782 [03:08<03:55, 1.87it/s]
355
  44%|████▍ | 343/782 [03:09<03:53, 1.88it/s]
356
  44%|████▍ | 344/782 [03:09<03:48, 1.91it/s]
357
  44%|████▍ | 345/782 [03:10<03:48, 1.92it/s]
358
  44%|████▍ | 346/782 [03:10<03:54, 1.86it/s]
359
  44%|████▍ | 347/782 [03:11<03:55, 1.85it/s]
360
  45%|████▍ | 348/782 [03:11<03:51, 1.88it/s]
361
  45%|████▍ | 349/782 [03:12<04:01, 1.79it/s]
362
  45%|████▍ | 350/782 [03:12<04:02, 1.78it/s]
363
 
 
364
  45%|████▍ | 350/782 [03:13<04:02, 1.78it/s]
365
  45%|████▍ | 351/782 [03:13<03:53, 1.84it/s]
366
  45%|████▌ | 352/782 [03:14<03:51, 1.86it/s]
367
  45%|████▌ | 353/782 [03:14<03:58, 1.80it/s]
368
  45%|████▌ | 354/782 [03:15<03:48, 1.88it/s]
369
  45%|████▌ | 355/782 [03:15<03:50, 1.86it/s]
370
  46%|████▌ | 356/782 [03:16<03:48, 1.86it/s]
371
  46%|████▌ | 357/782 [03:16<03:38, 1.95it/s]
372
  46%|████▌ | 358/782 [03:17<03:45, 1.88it/s]
373
  46%|████▌ | 359/782 [03:17<03:51, 1.83it/s]
374
  46%|████▌ | 360/782 [03:18<03:46, 1.86it/s]
375
  46%|████▌ | 361/782 [03:18<03:53, 1.81it/s]
376
  46%|████▋ | 362/782 [03:19<03:55, 1.78it/s]
377
  46%|████▋ | 363/782 [03:19<03:48, 1.84it/s]
378
  47%|████▋ | 364/782 [03:20<03:48, 1.83it/s]
379
  47%|████▋ | 365/782 [03:21<03:49, 1.82it/s]
380
  47%|████▋ | 366/782 [03:21<03:40, 1.89it/s]
381
  47%|████▋ | 367/782 [03:22<03:36, 1.92it/s]
382
  47%|████▋ | 368/782 [03:22<03:40, 1.88it/s]
383
  47%|████▋ | 369/782 [03:23<03:34, 1.92it/s]
384
  47%|████▋ | 370/782 [03:23<03:33, 1.93it/s]
385
  47%|████▋ | 371/782 [03:24<03:34, 1.92it/s]
386
  48%|████▊ | 372/782 [03:24<03:40, 1.86it/s]
387
  48%|████▊ | 373/782 [03:25<03:38, 1.87it/s]
388
  48%|████▊ | 374/782 [03:25<03:35, 1.89it/s]
389
  48%|████▊ | 375/782 [03:26<03:37, 1.87it/s]
390
  48%|████▊ | 376/782 [03:26<03:35, 1.88it/s]
391
  48%|████▊ | 377/782 [03:27<03:34, 1.89it/s]
392
  48%|████▊ | 378/782 [03:27<03:35, 1.88it/s]
393
  48%|████▊ | 379/782 [03:28<03:31, 1.91it/s]
394
  49%|████▊ | 380/782 [03:28<03:29, 1.91it/s]
395
  49%|████▊ | 381/782 [03:29<03:36, 1.85it/s]
396
  49%|████▉ | 382/782 [03:30<03:49, 1.74it/s]
397
  49%|████▉ | 383/782 [03:30<03:38, 1.83it/s]
398
  49%|████▉ | 384/782 [03:31<03:41, 1.79it/s]
399
  49%|████▉ | 385/782 [03:31<03:44, 1.77it/s]
400
  49%|████▉ | 386/782 [03:32<03:45, 1.76it/s]
401
  49%|████▉ | 387/782 [03:32<03:39, 1.80it/s]
402
  50%|████▉ | 388/782 [03:33<03:33, 1.84it/s]
403
  50%|████▉ | 389/782 [03:33<03:33, 1.84it/s]
404
  50%|████▉ | 390/782 [03:34<03:38, 1.79it/s]
405
  50%|█████ | 391/782 [03:35<03:28, 1.87it/s]
406
  50%|█████ | 392/782 [03:35<03:35, 1.81it/s]
407
  50%|█████ | 393/782 [03:36<03:48, 1.70it/s]
408
  50%|█████ | 394/782 [03:36<03:35, 1.80it/s]
409
  51%|█████ | 395/782 [03:37<03:34, 1.81it/s]
410
  51%|█████ | 396/782 [03:37<03:34, 1.80it/s]
411
  51%|█████ | 397/782 [03:38<03:31, 1.82it/s]
412
  51%|█████ | 398/782 [03:38<03:28, 1.84it/s]
413
  51%|█████ | 399/782 [03:39<03:31, 1.81it/s]
414
  51%|█████ | 400/782 [03:40<03:24, 1.87it/s]
415
 
 
416
  51%|█████ | 400/782 [03:40<03:24, 1.87it/s]
417
  51%|█████▏ | 401/782 [03:40<03:27, 1.84it/s]
418
  51%|█████▏ | 402/782 [03:41<03:33, 1.78it/s]
419
  52%|█████▏ | 403/782 [03:41<03:23, 1.86it/s]
420
  52%|█████▏ | 404/782 [03:42<03:23, 1.86it/s]
421
  52%|█████▏ | 405/782 [03:42<03:30, 1.79it/s]
422
  52%|█████▏ | 406/782 [03:43<03:20, 1.87it/s]
423
  52%|█████▏ | 407/782 [03:43<03:19, 1.88it/s]
424
  52%|█████▏ | 408/782 [03:44<03:23, 1.83it/s]
425
  52%|█████▏ | 409/782 [03:44<03:17, 1.89it/s]
426
  52%|█████▏ | 410/782 [03:45<03:16, 1.89it/s]
427
  53%|█████▎ | 411/782 [03:46<03:20, 1.85it/s]
428
  53%|█████▎ | 412/782 [03:46<03:22, 1.83it/s]
429
  53%|█████▎ | 413/782 [03:47<03:17, 1.87it/s]
430
  53%|█████▎ | 414/782 [03:47<03:14, 1.89it/s]
431
  53%|█████▎ | 415/782 [03:48<03:17, 1.86it/s]
432
  53%|█████▎ | 416/782 [03:48<03:18, 1.84it/s]
433
  53%|█████▎ | 417/782 [03:49<03:14, 1.88it/s]
434
  53%|█████▎ | 418/782 [03:49<03:21, 1.80it/s]
435
  54%|█████▎ | 419/782 [03:50<03:26, 1.76it/s]
436
  54%|█████▎ | 420/782 [03:50<03:18, 1.82it/s]
437
  54%|█████▍ | 421/782 [03:51<03:16, 1.84it/s]
438
  54%|█████▍ | 422/782 [03:51<03:13, 1.86it/s]
439
  54%|█████▍ | 423/782 [03:52<03:20, 1.79it/s]
440
  54%|█████▍ | 424/782 [03:53<03:14, 1.84it/s]
441
  54%|█████▍ | 425/782 [03:53<03:10, 1.88it/s]
442
  54%|█████▍ | 426/782 [03:54<03:13, 1.84it/s]
443
  55%|█████▍ | 427/782 [03:54<03:08, 1.88it/s]
444
  55%|█████▍ | 428/782 [03:55<03:08, 1.88it/s]
445
  55%|█████▍ | 429/782 [03:55<03:06, 1.89it/s]
446
  55%|█████▍ | 430/782 [03:56<03:08, 1.87it/s]
447
  55%|█████▌ | 431/782 [03:56<03:03, 1.91it/s]
448
  55%|█████▌ | 432/782 [03:57<03:07, 1.87it/s]
449
  55%|█████▌ | 433/782 [03:57<03:11, 1.82it/s]
450
  55%|█████▌ | 434/782 [03:58<03:05, 1.88it/s]
451
  56%|█████▌ | 435/782 [03:58<03:06, 1.86it/s]
452
  56%|█████▌ | 436/782 [03:59<03:14, 1.78it/s]
453
  56%|█████▌ | 437/782 [04:00<03:06, 1.85it/s]
454
  56%|█████▌ | 438/782 [04:00<03:04, 1.86it/s]
455
  56%|█████▌ | 439/782 [04:01<03:04, 1.86it/s]
456
  56%|█████▋ | 440/782 [04:01<03:00, 1.90it/s]
457
  56%|█████▋ | 441/782 [04:02<02:59, 1.90it/s]
458
  57%|█████▋ | 442/782 [04:02<03:02, 1.86it/s]
459
  57%|█████▋ | 443/782 [04:03<02:58, 1.90it/s]
460
  57%|█████▋ | 444/782 [04:03<02:59, 1.89it/s]
461
  57%|█████▋ | 445/782 [04:04<03:03, 1.83it/s]
462
  57%|█████▋ | 446/782 [04:04<02:53, 1.94it/s]
463
  57%|█████▋ | 447/782 [04:05<02:56, 1.90it/s]
464
  57%|█████▋ | 448/782 [04:05<03:00, 1.85it/s]
465
  57%|█████▋ | 449/782 [04:06<03:00, 1.85it/s]
466
  58%|█████▊ | 450/782 [04:06<02:56, 1.88it/s]
467
 
 
468
  58%|█████▊ | 450/782 [04:07<02:56, 1.88it/s]
469
  58%|█████▊ | 451/782 [04:07<02:53, 1.90it/s]
470
  58%|█████▊ | 452/782 [04:08<02:55, 1.88it/s]
471
  58%|█████▊ | 453/782 [04:08<02:49, 1.94it/s]
472
  58%|█████▊ | 454/782 [04:09<02:47, 1.96it/s]
473
  58%|█████▊ | 455/782 [04:09<02:48, 1.94it/s]
474
  58%|█████▊ | 456/782 [04:10<02:47, 1.95it/s]
475
  58%|█████▊ | 457/782 [04:10<02:46, 1.95it/s]
476
  59%|█████▊ | 458/782 [04:11<02:52, 1.88it/s]
477
  59%|█████▊ | 459/782 [04:11<02:56, 1.83it/s]
478
  59%|█████▉ | 460/782 [04:12<02:51, 1.88it/s]
479
  59%|█████▉ | 461/782 [04:12<02:52, 1.86it/s]
480
  59%|█████▉ | 462/782 [04:13<02:53, 1.85it/s]
481
  59%|█████▉ | 463/782 [04:13<02:51, 1.86it/s]
482
  59%|█████▉ | 464/782 [04:14<02:51, 1.85it/s]
483
  59%|█████▉ | 465/782 [04:14<02:47, 1.90it/s]
484
  60%|█████▉ | 466/782 [04:15<02:43, 1.94it/s]
485
  60%|█████▉ | 467/782 [04:15<02:43, 1.93it/s]
486
  60%|█████▉ | 468/782 [04:16<02:49, 1.85it/s]
487
  60%|█████▉ | 469/782 [04:16<02:40, 1.95it/s]
488
  60%|██████ | 470/782 [04:17<02:43, 1.91it/s]
489
  60%|██████ | 471/782 [04:18<02:45, 1.88it/s]
490
  60%|██████ | 472/782 [04:18<02:41, 1.92it/s]
491
  60%|██████ | 473/782 [04:19<02:42, 1.90it/s]
492
  61%|██████ | 474/782 [04:19<02:45, 1.86it/s]
493
  61%|██████ | 475/782 [04:20<02:39, 1.92it/s]
494
  61%|██████ | 476/782 [04:20<02:40, 1.91it/s]
495
  61%|██████ | 477/782 [04:21<02:40, 1.90it/s]
496
  61%|██████ | 478/782 [04:21<02:44, 1.85it/s]
497
  61%|██████▏ | 479/782 [04:22<02:41, 1.87it/s]
498
  61%|██████▏ | 480/782 [04:22<02:37, 1.91it/s]
499
  62%|██████▏ | 481/782 [04:23<02:41, 1.86it/s]
500
  62%|██████▏ | 482/782 [04:23<02:40, 1.87it/s]
501
  62%|██████▏ | 483/782 [04:24<02:37, 1.90it/s]
502
  62%|██████▏ | 484/782 [04:24<02:39, 1.87it/s]
503
  62%|██████▏ | 485/782 [04:25<02:42, 1.83it/s]
504
  62%|██████▏ | 486/782 [04:25<02:34, 1.92it/s]
505
  62%|██████▏ | 487/782 [04:26<02:35, 1.90it/s]
506
  62%|██████▏ | 488/782 [04:27<02:47, 1.76it/s]
507
  63%|██████▎ | 489/782 [04:27<02:38, 1.85it/s]
508
  63%|██████▎ | 490/782 [04:28<02:34, 1.89it/s]
509
  63%|██████▎ | 491/782 [04:28<02:33, 1.90it/s]
510
  63%|██████▎ | 492/782 [04:29<02:34, 1.88it/s]
511
  63%|██████▎ | 493/782 [04:29<02:30, 1.91it/s]
512
  63%|██████▎ | 494/782 [04:30<02:30, 1.91it/s]
513
  63%|██████▎ | 495/782 [04:30<02:30, 1.90it/s]
514
  63%|██████▎ | 496/782 [04:31<02:30, 1.90it/s]
515
  64%|██████▎ | 497/782 [04:31<02:28, 1.93it/s]
516
  64%|██████▎ | 498/782 [04:32<02:33, 1.85it/s]
517
  64%|██████▍ | 499/782 [04:32<02:33, 1.84it/s]
518
  64%|██████▍ | 500/782 [04:33<02:27, 1.91it/s]
519
 
 
520
  64%|██████▍ | 500/782 [04:33<02:27, 1.91it/s]
521
  64%|██████▍ | 501/782 [04:33<02:29, 1.88it/s]
522
  64%|██████▍ | 502/782 [04:34<02:29, 1.88it/s]
523
  64%|██████▍ | 503/782 [04:34<02:24, 1.93it/s]
524
  64%|██████▍ | 504/782 [04:35<02:27, 1.88it/s]
525
  65%|██████▍ | 505/782 [04:36<02:26, 1.89it/s]
526
  65%|██████▍ | 506/782 [04:36<02:23, 1.92it/s]
527
  65%|██████▍ | 507/782 [04:37<02:25, 1.88it/s]
528
  65%|██████▍ | 508/782 [04:37<02:26, 1.87it/s]
529
  65%|██████▌ | 509/782 [04:38<02:21, 1.93it/s]
530
  65%|██████▌ | 510/782 [04:38<02:22, 1.91it/s]
531
  65%|██████▌ | 511/782 [04:39<02:23, 1.89it/s]
532
  65%|██████▌ | 512/782 [04:39<02:27, 1.83it/s]
533
  66%|██████▌ | 513/782 [04:40<02:25, 1.85it/s]
534
  66%|██████▌ | 514/782 [04:40<02:21, 1.90it/s]
535
  66%|██████▌ | 515/782 [04:41<02:23, 1.86it/s]
536
  66%|██████▌ | 516/782 [04:41<02:27, 1.80it/s]
537
  66%|██████▌ | 517/782 [04:42<02:20, 1.88it/s]
538
  66%|██████▌ | 518/782 [04:43<02:21, 1.86it/s]
539
  66%|██████▋ | 519/782 [04:43<02:27, 1.78it/s]
540
  66%|██████▋ | 520/782 [04:44<02:20, 1.87it/s]
541
  67%|██████▋ | 521/782 [04:44<02:20, 1.86it/s]
542
  67%|██████▋ | 522/782 [04:45<02:21, 1.84it/s]
543
  67%|██████▋ | 523/782 [04:45<02:15, 1.91it/s]
544
  67%|██████▋ | 524/782 [04:46<02:15, 1.90it/s]
545
  67%|██████▋ | 525/782 [04:46<02:17, 1.86it/s]
546
  67%|██████▋ | 526/782 [04:47<02:11, 1.94it/s]
547
  67%|██████▋ | 527/782 [04:47<02:12, 1.92it/s]
548
  68%|██████▊ | 528/782 [04:48<02:16, 1.86it/s]
549
  68%|██████▊ | 529/782 [04:48<02:10, 1.94it/s]
550
  68%|██████▊ | 530/782 [04:49<02:09, 1.95it/s]
551
  68%|██████▊ | 531/782 [04:49<02:18, 1.81it/s]
552
  68%|██████▊ | 532/782 [04:50<02:18, 1.80it/s]
553
  68%|██████▊ | 533/782 [04:51<02:13, 1.86it/s]
554
  68%|██████▊ | 534/782 [04:51<02:11, 1.89it/s]
555
  68%|██████▊ | 535/782 [04:52<02:12, 1.87it/s]
556
  69%|██████▊ | 536/782 [04:52<02:15, 1.81it/s]
557
  69%|██████▊ | 537/782 [04:53<02:09, 1.89it/s]
558
  69%|██████▉ | 538/782 [04:53<02:08, 1.89it/s]
559
  69%|██████▉ | 539/782 [04:54<02:12, 1.84it/s]
560
  69%|██████▉ | 540/782 [04:54<02:08, 1.88it/s]
561
  69%|██████▉ | 541/782 [04:55<02:06, 1.91it/s]
562
  69%|██████▉ | 542/782 [04:55<02:07, 1.89it/s]
563
  69%|██████▉ | 543/782 [04:56<02:04, 1.92it/s]
564
  70%|██████▉ | 544/782 [04:56<02:02, 1.94it/s]
565
  70%|██████▉ | 545/782 [04:57<02:03, 1.92it/s]
566
  70%|██████▉ | 546/782 [04:57<02:05, 1.89it/s]
567
  70%|██████▉ | 547/782 [04:58<02:04, 1.88it/s]
568
  70%|███████ | 548/782 [04:58<02:04, 1.89it/s]
569
  70%|███████ | 549/782 [04:59<02:03, 1.88it/s]
570
  70%|███████ | 550/782 [05:00<02:02, 1.89it/s]
571
 
 
572
  70%|███████ | 550/782 [05:00<02:02, 1.89it/s]
573
  70%|███████ | 551/782 [05:00<02:03, 1.87it/s]
574
  71%|███████ | 552/782 [05:01<02:03, 1.86it/s]
575
  71%|███████ | 553/782 [05:01<02:03, 1.85it/s]
576
  71%|███████ | 554/782 [05:02<02:02, 1.86it/s]
577
  71%|███████ | 555/782 [05:02<02:01, 1.87it/s]
578
  71%|███████ | 556/782 [05:03<02:02, 1.85it/s]
579
  71%|███████ | 557/782 [05:03<02:08, 1.75it/s]
580
  71%|███████▏ | 558/782 [05:04<02:09, 1.73it/s]
581
  71%|███████▏ | 559/782 [05:05<02:08, 1.74it/s]
582
  72%|███████▏ | 560/782 [05:05<02:04, 1.79it/s]
583
  72%|███████▏ | 561/782 [05:06<02:09, 1.71it/s]
584
  72%|███████▏ | 562/782 [05:06<02:13, 1.65it/s]
585
  72%|███████▏ | 563/782 [05:07<02:19, 1.57it/s]
586
  72%|███████▏ | 564/782 [05:08<02:16, 1.59it/s]
587
  72%|███████▏ | 565/782 [05:08<02:17, 1.58it/s]
588
  72%|███████▏ | 566/782 [05:09<02:19, 1.55it/s]
589
  73%|███████▎ | 567/782 [05:10<02:18, 1.55it/s]
590
  73%|███████▎ | 568/782 [05:10<02:15, 1.58it/s]
591
  73%|███████▎ | 569/782 [05:11<02:20, 1.51it/s]
592
  73%|███████▎ | 570/782 [05:12<02:16, 1.55it/s]
593
  73%|███████▎ | 571/782 [05:12<02:16, 1.54it/s]
594
  73%|███████▎ | 572/782 [05:13<02:16, 1.54it/s]
595
  73%|███████▎ | 573/782 [05:14<02:19, 1.50it/s]
596
  73%|███████▎ | 574/782 [05:14<02:16, 1.53it/s]
597
  74%|███████▎ | 575/782 [05:15<02:15, 1.52it/s]
598
  74%|███████▎ | 576/782 [05:16<02:16, 1.50it/s]
599
  74%|███████▍ | 577/782 [05:16<02:15, 1.52it/s]
600
  74%|███████▍ | 578/782 [05:17<02:18, 1.47it/s]
601
  74%|███████▍ | 579/782 [05:18<02:12, 1.53it/s]
602
  74%|███████▍ | 580/782 [05:18<02:12, 1.53it/s]
603
  74%|███████▍ | 581/782 [05:19<02:15, 1.48it/s]
604
  74%|███████▍ | 582/782 [05:20<02:10, 1.53it/s]
605
  75%|███████▍ | 583/782 [05:20<02:11, 1.51it/s]
606
  75%|███████▍ | 584/782 [05:21<02:10, 1.51it/s]
607
  75%|███████▍ | 585/782 [05:22<02:07, 1.55it/s]
608
  75%|███████▍ | 586/782 [05:22<02:08, 1.53it/s]
609
  75%|███████▌ | 587/782 [05:23<02:11, 1.49it/s]
610
  75%|███████▌ | 588/782 [05:24<02:07, 1.52it/s]
611
  75%|███████▌ | 589/782 [05:24<02:09, 1.49it/s]
612
  75%|███████▌ | 590/782 [05:25<02:09, 1.49it/s]
613
  76%|███████▌ | 591/782 [05:26<02:05, 1.52it/s]
614
  76%|███████▌ | 592/782 [05:26<02:03, 1.54it/s]
615
  76%|███████▌ | 593/782 [05:27<02:01, 1.55it/s]
616
  76%|███████▌ | 594/782 [05:27<02:02, 1.53it/s]
617
  76%|███████▌ | 595/782 [05:28<02:01, 1.54it/s]
618
  76%|███████▌ | 596/782 [05:29<02:00, 1.54it/s]
619
  76%|███████▋ | 597/782 [05:29<02:01, 1.52it/s]
620
  76%|███████▋ | 598/782 [05:30<02:00, 1.53it/s]
621
  77%|███████▋ | 599/782 [05:31<01:56, 1.57it/s]
622
  77%|███████▋ | 600/782 [05:31<01:57, 1.54it/s]
623
 
 
624
  77%|███████▋ | 600/782 [05:31<01:57, 1.54it/s]
625
  77%|███████▋ | 601/782 [05:32<01:59, 1.52it/s]
626
  77%|███████▋ | 602/782 [05:33<01:56, 1.55it/s]
627
  77%|███████▋ | 603/782 [05:33<01:58, 1.51it/s]
628
  77%|███████▋ | 604/782 [05:34<02:01, 1.47it/s]
629
  77%|███████▋ | 605/782 [05:35<01:58, 1.49it/s]
630
  77%|███████▋ | 606/782 [05:35<01:55, 1.52it/s]
631
  78%|███████▊ | 607/782 [05:36<01:55, 1.51it/s]
632
  78%|███████▊ | 608/782 [05:37<01:50, 1.57it/s]
633
  78%|███████▊ | 609/782 [05:37<01:52, 1.54it/s]
634
  78%|███████▊ | 610/782 [05:38<01:57, 1.46it/s]
635
  78%|███████▊ | 611/782 [05:39<01:53, 1.51it/s]
636
  78%|███████▊ | 612/782 [05:39<01:55, 1.48it/s]
637
  78%|███████▊ | 613/782 [05:40<01:51, 1.52it/s]
638
  79%|███████▊ | 614/782 [05:41<01:48, 1.54it/s]
639
  79%|███████▊ | 615/782 [05:41<01:48, 1.54it/s]
640
  79%|███████▉ | 616/782 [05:42<01:51, 1.49it/s]
641
  79%|███████▉ | 617/782 [05:43<01:48, 1.53it/s]
642
  79%|███████▉ | 618/782 [05:43<01:50, 1.48it/s]
643
  79%|███████▉ | 619/782 [05:44<01:50, 1.48it/s]
644
  79%|███████▉ | 620/782 [05:45<01:48, 1.49it/s]
645
  79%|███████▉ | 621/782 [05:45<01:48, 1.48it/s]
646
  80%|███████▉ | 622/782 [05:46<01:47, 1.49it/s]
647
  80%|███████▉ | 623/782 [05:47<01:43, 1.54it/s]
648
  80%|███████▉ | 624/782 [05:47<01:42, 1.53it/s]
649
  80%|███████▉ | 625/782 [05:48<01:42, 1.53it/s]
650
  80%|████████ | 626/782 [05:49<01:42, 1.52it/s]
651
  80%|████████ | 627/782 [05:49<01:43, 1.50it/s]
652
  80%|████████ | 628/782 [05:50<01:42, 1.51it/s]
653
  80%|████████ | 629/782 [05:51<01:38, 1.56it/s]
654
  81%|████████ | 630/782 [05:51<01:43, 1.46it/s]
655
  81%|████████ | 631/782 [05:52<01:41, 1.48it/s]
656
  81%|████████ | 632/782 [05:52<01:33, 1.61it/s]
657
  81%|████████ | 633/782 [05:53<01:28, 1.69it/s]
658
  81%|████████ | 634/782 [05:54<01:27, 1.69it/s]
659
  81%|████████ | 635/782 [05:54<01:22, 1.78it/s]
660
  81%|████████▏ | 636/782 [05:55<01:22, 1.77it/s]
661
  81%|████████▏ | 637/782 [05:55<01:23, 1.73it/s]
662
  82%|████████▏ | 638/782 [05:56<01:21, 1.77it/s]
663
  82%|████████▏ | 639/782 [05:56<01:18, 1.82it/s]
664
  82%|████████▏ | 640/782 [05:57<01:18, 1.81it/s]
665
  82%|████████▏ | 641/782 [05:57<01:17, 1.83it/s]
666
  82%|████████▏ | 642/782 [05:58<01:14, 1.87it/s]
667
  82%|████████▏ | 643/782 [05:58<01:15, 1.85it/s]
668
  82%|████████▏ | 644/782 [05:59<01:14, 1.86it/s]
669
  82%|████████▏ | 645/782 [06:00<01:13, 1.85it/s]
670
  83%|████████▎ | 646/782 [06:00<01:13, 1.85it/s]
671
  83%|████████▎ | 647/782 [06:01<01:14, 1.82it/s]
672
  83%|████████▎ | 648/782 [06:01<01:11, 1.86it/s]
673
  83%|████████▎ | 649/782 [06:02<01:10, 1.88it/s]
674
  83%|████████▎ | 650/782 [06:02<01:11, 1.85it/s]
675
 
 
676
  83%|████████▎ | 650/782 [06:02<01:11, 1.85it/s]
677
  83%|████████▎ | 651/782 [06:03<01:10, 1.87it/s]
678
  83%|████████▎ | 652/782 [06:03<01:08, 1.89it/s]
679
  84%|████████▎ | 653/782 [06:04<01:11, 1.81it/s]
680
  84%|████████▎ | 654/782 [06:04<01:10, 1.83it/s]
681
  84%|████████▍ | 655/782 [06:05<01:07, 1.88it/s]
682
  84%|████████▍ | 656/782 [06:05<01:09, 1.83it/s]
683
  84%|████████▍ | 657/782 [06:06<01:08, 1.81it/s]
684
  84%|████████▍ | 658/782 [06:07<01:06, 1.88it/s]
685
  84%|████████▍ | 659/782 [06:07<01:06, 1.85it/s]
686
  84%|████████▍ | 660/782 [06:08<01:08, 1.79it/s]
687
  85%|████████▍ | 661/782 [06:08<01:04, 1.87it/s]
688
  85%|████████▍ | 662/782 [06:09<01:04, 1.86it/s]
689
  85%|████████▍ | 663/782 [06:09<01:05, 1.81it/s]
690
  85%|████████▍ | 664/782 [06:10<01:03, 1.86it/s]
691
  85%|████████▌ | 665/782 [06:10<01:03, 1.86it/s]
692
  85%|████████▌ | 666/782 [06:11<01:05, 1.78it/s]
693
  85%|████████▌ | 667/782 [06:11<01:01, 1.88it/s]
694
  85%|████████▌ | 668/782 [06:12<01:00, 1.88it/s]
695
  86%|████████▌ | 669/782 [06:12<01:00, 1.87it/s]
696
  86%|████████▌ | 670/782 [06:13<00:59, 1.88it/s]
697
  86%|████████▌ | 671/782 [06:14<00:58, 1.90it/s]
698
  86%|████████▌ | 672/782 [06:14<00:57, 1.92it/s]
699
  86%|████████▌ | 673/782 [06:15<00:58, 1.88it/s]
700
  86%|████████▌ | 674/782 [06:15<00:56, 1.90it/s]
701
  86%|████████▋ | 675/782 [06:16<00:55, 1.92it/s]
702
  86%|████████▋ | 676/782 [06:16<00:58, 1.82it/s]
703
  87%|████████▋ | 677/782 [06:17<00:58, 1.79it/s]
704
  87%|████████▋ | 678/782 [06:17<00:55, 1.88it/s]
705
  87%|████████▋ | 679/782 [06:18<00:55, 1.86it/s]
706
  87%|████████▋ | 680/782 [06:18<00:57, 1.77it/s]
707
  87%|████████▋ | 681/782 [06:19<00:53, 1.88it/s]
708
  87%|████████▋ | 682/782 [06:19<00:54, 1.84it/s]
709
  87%|████████▋ | 683/782 [06:20<00:54, 1.81it/s]
710
  87%|████████▋ | 684/782 [06:21<00:51, 1.90it/s]
711
  88%|████████��� | 685/782 [06:21<00:52, 1.85it/s]
712
  88%|████████▊ | 686/782 [06:22<00:52, 1.83it/s]
713
  88%|████████▊ | 687/782 [06:22<00:50, 1.89it/s]
714
  88%|████████▊ | 688/782 [06:23<00:49, 1.88it/s]
715
  88%|████████▊ | 689/782 [06:23<00:49, 1.89it/s]
716
  88%|████████▊ | 690/782 [06:24<00:49, 1.87it/s]
717
  88%|████████▊ | 691/782 [06:24<00:48, 1.89it/s]
718
  88%|████████▊ | 692/782 [06:25<00:47, 1.90it/s]
719
  89%|████████▊ | 693/782 [06:25<00:46, 1.90it/s]
720
  89%|████████▊ | 694/782 [06:26<00:46, 1.90it/s]
721
  89%|████████▉ | 695/782 [06:26<00:47, 1.84it/s]
722
  89%|████████▉ | 696/782 [06:27<00:45, 1.89it/s]
723
  89%|████████▉ | 697/782 [06:27<00:45, 1.87it/s]
724
  89%|████████▉ | 698/782 [06:28<00:44, 1.88it/s]
725
  89%|████████▉ | 699/782 [06:29<00:44, 1.85it/s]
726
  90%|████████▉ | 700/782 [06:29<00:43, 1.88it/s]
727
 
 
728
  90%|████████▉ | 700/782 [06:29<00:43, 1.88it/s]
729
  90%|████████▉ | 701/782 [06:30<00:43, 1.87it/s]
730
  90%|████████▉ | 702/782 [06:30<00:44, 1.80it/s]
731
  90%|████████▉ | 703/782 [06:31<00:44, 1.79it/s]
732
  90%|█████████ | 704/782 [06:31<00:41, 1.86it/s]
733
  90%|█████████ | 705/782 [06:32<00:41, 1.84it/s]
734
  90%|█████████ | 706/782 [06:32<00:40, 1.87it/s]
735
  90%|█████████ | 707/782 [06:33<00:39, 1.89it/s]
736
  91%|█████████ | 708/782 [06:33<00:39, 1.89it/s]
737
  91%|█████████ | 709/782 [06:34<00:38, 1.89it/s]
738
  91%|█████████ | 710/782 [06:34<00:39, 1.83it/s]
739
  91%|█████████ | 711/782 [06:35<00:38, 1.86it/s]
740
  91%|█████████ | 712/782 [06:36<00:37, 1.88it/s]
741
  91%|█████████ | 713/782 [06:36<00:37, 1.84it/s]
742
  91%|█████████▏| 714/782 [06:37<00:37, 1.82it/s]
743
  91%|█████████▏| 715/782 [06:37<00:35, 1.87it/s]
744
  92%|█████████▏| 716/782 [06:38<00:35, 1.86it/s]
745
  92%|█████████▏| 717/782 [06:38<00:35, 1.84it/s]
746
  92%|█████████▏| 718/782 [06:39<00:34, 1.87it/s]
747
  92%|█████████▏| 719/782 [06:39<00:33, 1.86it/s]
748
  92%|█████████▏| 720/782 [06:40<00:33, 1.87it/s]
749
  92%|█████████▏| 721/782 [06:40<00:32, 1.87it/s]
750
  92%|█████████▏| 722/782 [06:41<00:31, 1.91it/s]
751
  92%|█████████▏| 723/782 [06:41<00:30, 1.91it/s]
752
  93%|█████████▎| 724/782 [06:42<00:31, 1.84it/s]
753
  93%|█████████▎| 725/782 [06:43<00:31, 1.82it/s]
754
  93%|█████████▎| 726/782 [06:43<00:31, 1.77it/s]
755
  93%|█████████▎| 727/782 [06:44<00:30, 1.80it/s]
756
  93%|█████████▎| 728/782 [06:44<00:29, 1.81it/s]
757
  93%|█████████▎| 729/782 [06:45<00:29, 1.82it/s]
758
  93%|█████████▎| 730/782 [06:45<00:28, 1.85it/s]
759
  93%|█████████▎| 731/782 [06:46<00:27, 1.86it/s]
760
  94%|█████████▎| 732/782 [06:46<00:27, 1.85it/s]
761
  94%|█████████▎| 733/782 [06:47<00:26, 1.88it/s]
762
  94%|█████████▍| 734/782 [06:47<00:25, 1.86it/s]
763
  94%|█████████▍| 735/782 [06:48<00:25, 1.85it/s]
764
  94%|█████████▍| 736/782 [06:49<00:24, 1.88it/s]
765
  94%|█████████▍| 737/782 [06:49<00:23, 1.89it/s]
766
  94%|█████████▍| 738/782 [06:50<00:23, 1.88it/s]
767
  95%|█████████▍| 739/782 [06:50<00:22, 1.90it/s]
768
  95%|█████████▍| 740/782 [06:51<00:22, 1.90it/s]
769
  95%|█████████▍| 741/782 [06:51<00:22, 1.85it/s]
770
  95%|█████████▍| 742/782 [06:52<00:21, 1.89it/s]
771
  95%|█████████▌| 743/782 [06:52<00:20, 1.91it/s]
772
  95%|█████████▌| 744/782 [06:53<00:20, 1.84it/s]
773
  95%|█████████▌| 745/782 [06:53<00:19, 1.88it/s]
774
  95%|█████████▌| 746/782 [06:54<00:19, 1.88it/s]
775
  96%|█████████▌| 747/782 [06:54<00:19, 1.83it/s]
776
  96%|█████████▌| 748/782 [06:55<00:18, 1.82it/s]
777
  96%|█████████▌| 749/782 [06:55<00:17, 1.86it/s]
778
  96%|█████████▌| 750/782 [06:56<00:17, 1.81it/s]
779
 
 
780
  96%|█████████▌| 750/782 [06:56<00:17, 1.81it/s]
781
  96%|█████████▌| 751/782 [06:57<00:17, 1.73it/s]
782
  96%|█████████▌| 752/782 [06:57<00:16, 1.82it/s]
783
  96%|█████████▋| 753/782 [06:58<00:15, 1.83it/s]
784
  96%|█████████▋| 754/782 [06:58<00:15, 1.80it/s]
785
  97%|█████████▋| 755/782 [06:59<00:14, 1.82it/s]
786
  97%|█████████▋| 756/782 [06:59<00:14, 1.83it/s]
787
  97%|█████████▋| 757/782 [07:00<00:13, 1.82it/s]
788
  97%|█████████▋| 758/782 [07:00<00:13, 1.80it/s]
789
  97%|█████████▋| 759/782 [07:01<00:12, 1.83it/s]
790
  97%|█████████▋| 760/782 [07:02<00:11, 1.89it/s]
791
  97%|█████████▋| 761/782 [07:02<00:11, 1.90it/s]
792
  97%|█████████▋| 762/782 [07:03<00:10, 1.90it/s]
793
  98%|█████████▊| 763/782 [07:03<00:09, 1.91it/s]
794
  98%|█████████▊| 764/782 [07:04<00:09, 1.89it/s]
795
  98%|█████████▊| 765/782 [07:04<00:09, 1.88it/s]
796
  98%|█████████▊| 766/782 [07:05<00:08, 1.86it/s]
797
  98%|█████████▊| 767/782 [07:05<00:08, 1.85it/s]
798
  98%|█████████▊| 768/782 [07:06<00:07, 1.87it/s]
799
  98%|█████████▊| 769/782 [07:06<00:06, 1.87it/s]
800
  98%|█████████▊| 770/782 [07:07<00:06, 1.86it/s]
801
  99%|█████████▊| 771/782 [07:07<00:05, 1.90it/s]
802
  99%|█████████▊| 772/782 [07:08<00:05, 1.92it/s]
803
  99%|█████████▉| 773/782 [07:08<00:04, 1.85it/s]
804
  99%|█████████▉| 774/782 [07:09<00:04, 1.85it/s]
805
  99%|█████████▉| 775/782 [07:09<00:03, 1.91it/s]
806
  99%|█████████▉| 776/782 [07:10<00:03, 1.90it/s]
807
  99%|█████████▉| 777/782 [07:11<00:02, 1.90it/s]
808
  99%|█████████▉| 778/782 [07:11<00:02, 1.92it/s]
809
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [2025-05-13 01:08:08] Created output directory: train_results/google_t5-v1_1-large_ds100_upsample1000
2
+ [2025-05-13 01:08:08] Chat mode disabled
3
+ [2025-05-13 01:08:08] Model size is 3B or smaller (0 B). Using full fine-tuning.
4
+ [2025-05-13 01:08:08] Adjusted parameters for t5 model:
5
+ [2025-05-13 01:08:08] - LEARNING_RATE: 1e-4
6
+ [2025-05-13 01:08:08] - BATCH_SIZE: 64
7
+ [2025-05-13 01:08:08] - GRADIENT_ACCUMULATION_STEPS: 1
8
+ [2025-05-13 01:08:08] No QA format data will be used
9
+ [2025-05-13 01:08:08] Limiting dataset size to: 100 samples
10
+ [2025-05-13 01:08:08] =======================================
11
+ [2025-05-13 01:08:08] Starting training for model: google/t5-v1_1-large
12
+ [2025-05-13 01:08:08] =======================================
13
+ [2025-05-13 01:08:08] CUDA_VISIBLE_DEVICES: 2,3
14
+ [2025-05-13 01:08:08] WANDB_PROJECT: wikidyk-ar
15
+ [2025-05-13 01:08:08] DATA_PATH: data/wikidyk2022-2025_01082025_gpt-4o_evalv2_pages_formatted_combined_v2.json
16
+ [2025-05-13 01:08:08] Global Batch Size: 128
17
+ [2025-05-13 01:08:08] Data Size: 100
18
+ [2025-05-13 01:08:08] Executing command: torchrun --nproc_per_node "2" --master-port 29501 src/train.py --model_name_or_path "google/t5-v1_1-large" --data_path "data/wikidyk2022-2025_01082025_gpt-4o_evalv2_pages_formatted_combined_v2.json" --output_dir "train_results/google_t5-v1_1-large_ds100_upsample1000" --num_upsample "1000" --per_device_train_batch_size "64" --gradient_accumulation_steps "1" --learning_rate "1e-4" --num_train_epochs "1" --model_max_length "32768" --report_to wandb --logging_steps 50 --save_strategy no --bf16 True --use_flash_attention_2 True --qa_data_ratio "-1" --predict_mask "false" --ds_size 100
19
+ [2025-05-13 01:08:08] Training started at Tue May 13 01:08:08 UTC 2025
20
+ W0513 01:08:10.171000 443637 site-packages/torch/distributed/run.py:792]
21
+ W0513 01:08:10.171000 443637 site-packages/torch/distributed/run.py:792] *****************************************
22
+ W0513 01:08:10.171000 443637 site-packages/torch/distributed/run.py:792] Setting OMP_NUM_THREADS environment variable for each process to be 1 in default, to avoid your system being overloaded, please further tune the variable for optimal performance in your application as needed.
23
+ W0513 01:08:10.171000 443637 site-packages/torch/distributed/run.py:792] *****************************************
24
+ WARNING:root:Output directory: train_results/google_t5-v1_1-large_ds100_upsample1000
25
+ WARNING:root:Output directory: train_results/google_t5-v1_1-large_ds100_upsample1000
26
+ You are using the default legacy behaviour of the <class 'transformers.models.t5.tokenization_t5.T5Tokenizer'>. This is expected, and simply means that the `legacy` (previous) behavior will be used so nothing changes for you. If you want to use the new behaviour, set `legacy=False`. This should only be set if you understand what it means, and thoroughly read the reason why this was added as explained in https://github.com/huggingface/transformers/pull/24565
27
+ You are using the default legacy behaviour of the <class 'transformers.models.t5.tokenization_t5.T5Tokenizer'>. This is expected, and simply means that the `legacy` (previous) behavior will be used so nothing changes for you. If you want to use the new behaviour, set `legacy=False`. This should only be set if you understand what it means, and thoroughly read the reason why this was added as explained in https://github.com/huggingface/transformers/pull/24565
28
+ WARNING:root:Loading data...
29
+ WARNING:root:Loading data...
30
+ WARNING:root:Dataset initialized with all QA data:
31
+ WARNING:root: - 0 QA examples
32
+ WARNING:root: - 100 fact examples with upsampling factor 1000
33
+ WARNING:root: - Total examples: 100000
34
+ WARNING:root:Dataset initialized with all QA data:
35
+ WARNING:root: - 0 QA examples
36
+ WARNING:root: - 100 fact examples with upsampling factor 1000
37
+ WARNING:root: - Total examples: 100000
38
+ /root/yuwei/WikiDYKEvalV2/src/train.py:119: FutureWarning: `tokenizer` is deprecated and will be removed in version 5.0.0 for `Trainer.__init__`. Use `processing_class` instead.
39
+ trainer = Trainer(model=model, tokenizer=tokenizer, args=training_args, **data_module)
40
+ /root/yuwei/WikiDYKEvalV2/src/train.py:119: FutureWarning: `tokenizer` is deprecated and will be removed in version 5.0.0 for `Trainer.__init__`. Use `processing_class` instead.
41
+ trainer = Trainer(model=model, tokenizer=tokenizer, args=training_args, **data_module)
42
+ wandb: WARNING The `run_name` is currently set to the same value as `TrainingArguments.output_dir`. If this was not intended, please specify a different run name by setting the `TrainingArguments.run_name` parameter.
43
+ /root/miniconda3/envs/wikidyk/lib/python3.10/site-packages/transformers/tokenization_utils_base.py:3980: UserWarning: `as_target_tokenizer` is deprecated and will be removed in v5 of Transformers. You can tokenize your labels by using the argument `text_target` of the regular `__call__` method (either in the same call as your input texts if you use the same keyword arguments, or in a separate call.
44
+ warnings.warn(
45
+ wandb: Currently logged in as: yuweiz to https://api.wandb.ai. Use `wandb login --relogin` to force relogin
46
+ Passing a tuple of `past_key_values` is deprecated and will be removed in Transformers v4.48.0. You should pass an instance of `EncoderDecoderCache` instead, e.g. `past_key_values=EncoderDecoderCache.from_legacy_cache(past_key_values)`.
47
+ [rank1]:[W513 01:08:40.694530638 reducer.cpp:1400] Warning: find_unused_parameters=True was specified in DDP constructor, but did not find any unused parameters in the forward pass. This flag results in an extra traversal of the autograd graph every iteration, which can adversely affect performance. If your model indeed never has any unused parameters in the forward pass, consider turning this flag off. Note that this warning may be a false positive if your model has flow control causing later iterations to have unused parameters. (function operator())
48
+ wandb: Tracking run with wandb version 0.19.11
49
+ wandb: Run data is saved locally in /root/yuwei/WikiDYKEvalV2/wandb/run-20250513_010840-ovxz0tx6
50
+ wandb: Run `wandb offline` to turn off syncing.
51
+ wandb: Syncing run train_results/google_t5-v1_1-large_ds100_upsample1000
52
+ wandb: ⭐️ View project at https://wandb.ai/yuweiz/wikidyk-ar
53
+ wandb: 🚀 View run at https://wandb.ai/yuweiz/wikidyk-ar/runs/ovxz0tx6
54
+
55
  0%| | 0/782 [00:00<?, ?it/s]/root/miniconda3/envs/wikidyk/lib/python3.10/site-packages/transformers/tokenization_utils_base.py:3980: UserWarning: `as_target_tokenizer` is deprecated and will be removed in v5 of Transformers. You can tokenize your labels by using the argument `text_target` of the regular `__call__` method (either in the same call as your input texts if you use the same keyword arguments, or in a separate call.
56
+ warnings.warn(
57
+ Passing a tuple of `past_key_values` is deprecated and will be removed in Transformers v4.48.0. You should pass an instance of `EncoderDecoderCache` instead, e.g. `past_key_values=EncoderDecoderCache.from_legacy_cache(past_key_values)`.
58
+ [rank0]:[W513 01:08:40.426723468 reducer.cpp:1400] Warning: find_unused_parameters=True was specified in DDP constructor, but did not find any unused parameters in the forward pass. This flag results in an extra traversal of the autograd graph every iteration, which can adversely affect performance. If your model indeed never has any unused parameters in the forward pass, consider turning this flag off. Note that this warning may be a false positive if your model has flow control causing later iterations to have unused parameters. (function operator())
59
+
60
  0%| | 1/782 [00:00<11:29, 1.13it/s]
61
  0%| | 2/782 [00:02<15:37, 1.20s/it]
62
  0%| | 3/782 [00:02<11:24, 1.14it/s]
63
  1%| | 4/782 [00:03<09:45, 1.33it/s]
64
  1%| | 5/782 [00:03<08:53, 1.46it/s]
65
  1%| | 6/782 [00:04<07:57, 1.62it/s]
66
  1%| | 7/782 [00:05<10:15, 1.26it/s]
67
  1%| | 8/782 [00:06<09:03, 1.42it/s]
68
  1%| | 9/782 [00:06<08:31, 1.51it/s]
69
  1%|▏ | 10/782 [00:07<08:10, 1.57it/s]
70
  1%|▏ | 11/782 [00:07<07:35, 1.69it/s]
71
  2%|▏ | 12/782 [00:08<07:17, 1.76it/s]
72
  2%|▏ | 13/782 [00:08<07:22, 1.74it/s]
73
  2%|▏ | 14/782 [00:09<07:07, 1.80it/s]
74
  2%|▏ | 15/782 [00:09<06:59, 1.83it/s]
75
  2%|▏ | 16/782 [00:10<06:50, 1.87it/s]
76
  2%|▏ | 17/782 [00:10<06:54, 1.85it/s]
77
  2%|▏ | 18/782 [00:11<06:49, 1.87it/s]
78
  2%|▏ | 19/782 [00:11<06:42, 1.90it/s]
79
  3%|▎ | 20/782 [00:12<06:51, 1.85it/s]
80
  3%|▎ | 21/782 [00:13<06:52, 1.85it/s]
81
  3%|▎ | 22/782 [00:13<06:37, 1.91it/s]
82
  3%|▎ | 23/782 [00:14<06:56, 1.82it/s]
83
  3%|▎ | 24/782 [00:14<06:59, 1.81it/s]
84
  3%|▎ | 25/782 [00:15<06:37, 1.90it/s]
85
  3%|▎ | 26/782 [00:15<06:40, 1.89it/s]
86
  3%|▎ | 27/782 [00:16<06:50, 1.84it/s]
87
  4%|▎ | 28/782 [00:16<06:48, 1.85it/s]
88
  4%|▎ | 29/782 [00:17<06:40, 1.88it/s]
89
  4%|▍ | 30/782 [00:17<06:41, 1.87it/s]
90
  4%|▍ | 31/782 [00:18<06:38, 1.89it/s]
91
  4%|▍ | 32/782 [00:18<06:35, 1.89it/s]
92
  4%|▍ | 33/782 [00:19<06:40, 1.87it/s]
93
  4%|▍ | 34/782 [00:19<06:34, 1.89it/s]
94
  4%|▍ | 35/782 [00:20<06:34, 1.90it/s]
95
  5%|▍ | 36/782 [00:21<06:40, 1.86it/s]
96
  5%|▍ | 37/782 [00:21<06:29, 1.91it/s]
97
  5%|▍ | 38/782 [00:22<08:52, 1.40it/s]
98
  5%|▍ | 39/782 [00:23<08:07, 1.52it/s]
99
  5%|▌ | 40/782 [00:23<07:41, 1.61it/s]
100
  5%|▌ | 41/782 [00:24<07:14, 1.71it/s]
101
  5%|▌ | 42/782 [00:24<06:50, 1.80it/s]
102
  5%|▌ | 43/782 [00:25<06:53, 1.79it/s]
103
  6%|▌ | 44/782 [00:25<07:05, 1.74it/s]
104
  6%|▌ | 45/782 [00:26<06:50, 1.80it/s]
105
  6%|▌ | 46/782 [00:27<06:47, 1.81it/s]
106
  6%|▌ | 47/782 [00:27<06:47, 1.80it/s]
107
  6%|▌ | 48/782 [00:28<06:53, 1.78it/s]
108
  6%|▋ | 49/782 [00:28<06:33, 1.86it/s]
109
  6%|▋ | 50/782 [00:29<06:33, 1.86it/s]
110
 
111
+
112
  6%|▋ | 50/782 [00:29<06:33, 1.86it/s]
113
  7%|▋ | 51/782 [00:29<06:53, 1.77it/s]
114
  7%|▋ | 52/782 [00:30<06:49, 1.78it/s]
115
  7%|▋ | 53/782 [00:30<06:34, 1.85it/s]
116
  7%|▋ | 54/782 [00:31<06:31, 1.86it/s]
117
  7%|▋ | 55/782 [00:32<06:50, 1.77it/s]
118
  7%|▋ | 56/782 [00:32<06:42, 1.80it/s]
119
  7%|▋ | 57/782 [00:33<06:32, 1.85it/s]
120
  7%|▋ | 58/782 [00:33<06:25, 1.88it/s]
121
  8%|▊ | 59/782 [00:34<06:32, 1.84it/s]
122
  8%|▊ | 60/782 [00:34<06:28, 1.86it/s]
123
  8%|▊ | 61/782 [00:35<06:18, 1.90it/s]
124
  8%|▊ | 62/782 [00:36<08:41, 1.38it/s]
125
  8%|▊ | 63/782 [00:36<08:00, 1.50it/s]
126
  8%|▊ | 64/782 [00:37<07:31, 1.59it/s]
127
  8%|▊ | 65/782 [00:37<06:59, 1.71it/s]
128
  8%|▊ | 66/782 [00:38<06:56, 1.72it/s]
129
  9%|▊ | 67/782 [00:39<06:52, 1.73it/s]
130
  9%|▊ | 68/782 [00:39<06:35, 1.81it/s]
131
  9%|▉ | 69/782 [00:40<06:38, 1.79it/s]
132
  9%|▉ | 70/782 [00:40<06:58, 1.70it/s]
133
  9%|▉ | 71/782 [00:41<06:36, 1.79it/s]
134
  9%|▉ | 72/782 [00:41<06:26, 1.84it/s]
135
  9%|▉ | 73/782 [00:42<06:22, 1.85it/s]
136
  9%|▉ | 74/782 [00:42<06:24, 1.84it/s]
137
  10%|▉ | 75/782 [00:43<06:24, 1.84it/s]
138
  10%|▉ | 76/782 [00:43<06:30, 1.81it/s]
139
  10%|▉ | 77/782 [00:44<06:43, 1.75it/s]
140
  10%|▉ | 78/782 [00:45<06:40, 1.76it/s]
141
  10%|█ | 79/782 [00:45<06:28, 1.81it/s]
142
  10%|█ | 80/782 [00:46<06:27, 1.81it/s]
143
  10%|█ | 81/782 [00:46<06:33, 1.78it/s]
144
  10%|█ | 82/782 [00:47<06:17, 1.85it/s]
145
  11%|█ | 83/782 [00:47<06:09, 1.89it/s]
146
  11%|█ | 84/782 [00:48<06:09, 1.89it/s]
147
  11%|█ | 85/782 [00:48<06:16, 1.85it/s]
148
  11%|█ | 86/782 [00:49<06:16, 1.85it/s]
149
  11%|█ | 87/782 [00:49<06:07, 1.89it/s]
150
  11%|█▏ | 88/782 [00:50<06:10, 1.87it/s]
151
  11%|█▏ | 89/782 [00:50<06:07, 1.89it/s]
152
  12%|█▏ | 90/782 [00:51<06:02, 1.91it/s]
153
  12%|█▏ | 91/782 [00:52<06:33, 1.76it/s]
154
  12%|█▏ | 92/782 [00:53<09:21, 1.23it/s]
155
  12%|█▏ | 93/782 [00:54<08:28, 1.35it/s]
156
  12%|█▏ | 94/782 [00:54<07:33, 1.52it/s]
157
  12%|█▏ | 95/782 [00:55<07:15, 1.58it/s]
158
  12%|█▏ | 96/782 [00:55<07:19, 1.56it/s]
159
  12%|█▏ | 97/782 [00:56<06:48, 1.68it/s]
160
  13%|█▎ | 98/782 [00:56<06:40, 1.71it/s]
161
  13%|█▎ | 99/782 [00:57<06:28, 1.76it/s]
162
  13%|█▎ | 100/782 [00:57<06:23, 1.78it/s]
163
 
164
+
165
  13%|█▎ | 100/782 [00:58<06:23, 1.78it/s]
166
  13%|█▎ | 101/782 [00:58<06:15, 1.81it/s]
167
  13%|█▎ | 102/782 [00:59<06:08, 1.84it/s]
168
  13%|█▎ | 103/782 [00:59<06:12, 1.82it/s]
169
  13%|█▎ | 104/782 [01:00<06:14, 1.81it/s]
170
  13%|█▎ | 105/782 [01:00<06:01, 1.87it/s]
171
  14%|█▎ | 106/782 [01:01<05:58, 1.88it/s]
172
  14%|█▎ | 107/782 [01:01<06:06, 1.84it/s]
173
  14%|█▍ | 108/782 [01:02<05:53, 1.91it/s]
174
  14%|█▍ | 109/782 [01:02<05:59, 1.87it/s]
175
  14%|█▍ | 110/782 [01:03<06:05, 1.84it/s]
176
  14%|█▍ | 111/782 [01:03<05:54, 1.89it/s]
177
  14%|█▍ | 112/782 [01:04<05:57, 1.87it/s]
178
  14%|█▍ | 113/782 [01:04<06:02, 1.85it/s]
179
  15%|█▍ | 114/782 [01:05<05:52, 1.89it/s]
180
  15%|█▍ | 115/782 [01:05<05:59, 1.85it/s]
181
  15%|█▍ | 116/782 [01:06<06:02, 1.84it/s]
182
  15%|█▍ | 117/782 [01:07<05:49, 1.90it/s]
183
  15%|█▌ | 118/782 [01:07<05:57, 1.86it/s]
184
  15%|█▌ | 119/782 [01:08<06:02, 1.83it/s]
185
  15%|█▌ | 120/782 [01:08<05:54, 1.87it/s]
186
  15%|█▌ | 121/782 [01:09<05:52, 1.88it/s]
187
  16%|█▌ | 122/782 [01:09<06:00, 1.83it/s]
188
  16%|█▌ | 123/782 [01:10<05:54, 1.86it/s]
189
  16%|█▌ | 124/782 [01:10<05:49, 1.89it/s]
190
  16%|█▌ | 125/782 [01:11<05:45, 1.90it/s]
191
  16%|█▌ | 126/782 [01:11<05:49, 1.88it/s]
192
  16%|█▌ | 127/782 [01:12<05:41, 1.92it/s]
193
  16%|█▋ | 128/782 [01:12<05:33, 1.96it/s]
194
  16%|█▋ | 129/782 [01:13<05:43, 1.90it/s]
195
  17%|█▋ | 130/782 [01:13<05:48, 1.87it/s]
196
  17%|█▋ | 131/782 [01:14<05:36, 1.94it/s]
197
  17%|█▋ | 132/782 [01:14<05:44, 1.89it/s]
198
  17%|█▋ | 133/782 [01:15<05:58, 1.81it/s]
199
  17%|█▋ | 134/782 [01:16<05:47, 1.87it/s]
200
  17%|█▋ | 135/782 [01:16<05:53, 1.83it/s]
201
  17%|█▋ | 136/782 [01:17<06:16, 1.72it/s]
202
  18%|█▊ | 137/782 [01:17<05:56, 1.81it/s]
203
  18%|█▊ | 138/782 [01:18<05:55, 1.81it/s]
204
  18%|█▊ | 139/782 [01:18<06:02, 1.77it/s]
205
  18%|█▊ | 140/782 [01:19<05:45, 1.86it/s]
206
  18%|█▊ | 141/782 [01:19<05:41, 1.88it/s]
207
  18%|█▊ | 142/782 [01:20<05:41, 1.88it/s]
208
  18%|█▊ | 143/782 [01:20<05:35, 1.91it/s]
209
  18%|█▊ | 144/782 [01:21<05:34, 1.91it/s]
210
  19%|█▊ | 145/782 [01:22<05:32, 1.92it/s]
211
  19%|█▊ | 146/782 [01:22<05:53, 1.80it/s]
212
  19%|█▉ | 147/782 [01:23<05:42, 1.86it/s]
213
  19%|█▉ | 148/782 [01:23<05:40, 1.86it/s]
214
  19%|█▉ | 149/782 [01:24<05:44, 1.84it/s]
215
  19%|█▉ | 150/782 [01:24<05:44, 1.84it/s]
216
 
217
+
218
  19%|█▉ | 150/782 [01:24<05:44, 1.84it/s]
219
  19%|█▉ | 151/782 [01:25<05:36, 1.87it/s]
220
  19%|█▉ | 152/782 [01:25<05:39, 1.86it/s]
221
  20%|█▉ | 153/782 [01:26<05:49, 1.80it/s]
222
  20%|█▉ | 154/782 [01:26<05:34, 1.88it/s]
223
  20%|█▉ | 155/782 [01:27<05:42, 1.83it/s]
224
  20%|█▉ | 156/782 [01:28<05:57, 1.75it/s]
225
  20%|██ | 157/782 [01:28<05:43, 1.82it/s]
226
  20%|██ | 158/782 [01:29<05:38, 1.85it/s]
227
  20%|██ | 159/782 [01:29<05:47, 1.79it/s]
228
  20%|██ | 160/782 [01:30<05:37, 1.84it/s]
229
  21%|██ | 161/782 [01:30<05:37, 1.84it/s]
230
  21%|██ | 162/782 [01:31<05:53, 1.75it/s]
231
  21%|██ | 163/782 [01:31<05:43, 1.80it/s]
232
  21%|██ | 164/782 [01:32<05:34, 1.85it/s]
233
  21%|██ | 165/782 [01:32<05:27, 1.88it/s]
234
  21%|██ | 166/782 [01:33<05:31, 1.86it/s]
235
  21%|██▏ | 167/782 [01:34<05:51, 1.75it/s]
236
  21%|██▏ | 168/782 [01:34<05:29, 1.86it/s]
237
  22%|██▏ | 169/782 [01:35<05:31, 1.85it/s]
238
  22%|██▏ | 170/782 [01:35<05:39, 1.80it/s]
239
  22%|██▏ | 171/782 [01:36<05:23, 1.89it/s]
240
  22%|██▏ | 172/782 [01:36<05:27, 1.86it/s]
241
  22%|██▏ | 173/782 [01:37<05:29, 1.85it/s]
242
  22%|██▏ | 174/782 [01:37<05:31, 1.84it/s]
243
  22%|██▏ | 175/782 [01:38<05:23, 1.88it/s]
244
  23%|██▎ | 176/782 [01:38<05:26, 1.86it/s]
245
  23%|██▎ | 177/782 [01:39<05:23, 1.87it/s]
246
  23%|██▎ | 178/782 [01:40<05:23, 1.86it/s]
247
  23%|██▎ | 179/782 [01:40<05:17, 1.90it/s]
248
  23%|██▎ | 180/782 [01:41<05:24, 1.86it/s]
249
  23%|██▎ | 181/782 [01:41<05:21, 1.87it/s]
250
  23%|██▎ | 182/782 [01:42<05:21, 1.87it/s]
251
  23%|██▎ | 183/782 [01:42<05:22, 1.86it/s]
252
  24%|██▎ | 184/782 [01:43<05:19, 1.87it/s]
253
  24%|██▎ | 185/782 [01:43<05:20, 1.86it/s]
254
  24%|██▍ | 186/782 [01:44<05:28, 1.82it/s]
255
  24%|██▍ | 187/782 [01:44<05:18, 1.87it/s]
256
  24%|██▍ | 188/782 [01:45<05:15, 1.89it/s]
257
  24%|██▍ | 189/782 [01:45<05:16, 1.87it/s]
258
  24%|██▍ | 190/782 [01:46<05:16, 1.87it/s]
259
  24%|██▍ | 191/782 [01:46<05:12, 1.89it/s]
260
  25%|██▍ | 192/782 [01:47<05:29, 1.79it/s]
261
  25%|██▍ | 193/782 [01:48<05:26, 1.81it/s]
262
  25%|██▍ | 194/782 [01:48<05:18, 1.84it/s]
263
  25%|██▍ | 195/782 [01:49<05:22, 1.82it/s]
264
  25%|██▌ | 196/782 [01:49<05:20, 1.83it/s]
265
  25%|██▌ | 197/782 [01:50<05:10, 1.88it/s]
266
  25%|██▌ | 198/782 [01:50<05:15, 1.85it/s]
267
  25%|██▌ | 199/782 [01:51<05:31, 1.76it/s]
268
  26%|██▌ | 200/782 [01:51<05:20, 1.81it/s]
269
 
270
+
271
  26%|██▌ | 200/782 [01:52<05:20, 1.81it/s]
272
  26%|██▌ | 201/782 [01:52<05:17, 1.83it/s]
273
  26%|██▌ | 202/782 [01:53<05:25, 1.78it/s]
274
  26%|██▌ | 203/782 [01:53<05:12, 1.85it/s]
275
  26%|██▌ | 204/782 [01:54<05:13, 1.84it/s]
276
  26%|██▌ | 205/782 [01:54<05:23, 1.79it/s]
277
  26%|██▋ | 206/782 [01:55<05:07, 1.87it/s]
278
  26%|██▋ | 207/782 [01:55<05:09, 1.86it/s]
279
  27%|██▋ | 208/782 [01:56<05:20, 1.79it/s]
280
  27%|██▋ | 209/782 [01:56<05:12, 1.83it/s]
281
  27%|██▋ | 210/782 [01:57<05:05, 1.87it/s]
282
  27%|██▋ | 211/782 [01:57<05:03, 1.88it/s]
283
  27%|██▋ | 212/782 [01:58<05:05, 1.86it/s]
284
  27%|██▋ | 213/782 [01:59<05:15, 1.80it/s]
285
  27%|██▋ | 214/782 [01:59<05:02, 1.88it/s]
286
  27%|██▋ | 215/782 [02:00<05:07, 1.85it/s]
287
  28%|██▊ | 216/782 [02:00<05:14, 1.80it/s]
288
  28%|██▊ | 217/782 [02:01<05:02, 1.87it/s]
289
  28%|██▊ | 218/782 [02:01<05:03, 1.86it/s]
290
  28%|██▊ | 219/782 [02:02<05:09, 1.82it/s]
291
  28%|██▊ | 220/782 [02:02<04:59, 1.88it/s]
292
  28%|██▊ | 221/782 [02:03<04:57, 1.89it/s]
293
  28%|██▊ | 222/782 [02:03<04:51, 1.92it/s]
294
  29%|██▊ | 223/782 [02:04<04:56, 1.89it/s]
295
  29%|██▊ | 224/782 [02:04<04:56, 1.88it/s]
296
  29%|██▉ | 225/782 [02:05<04:48, 1.93it/s]
297
  29%|██▉ | 226/782 [02:05<04:55, 1.88it/s]
298
  29%|██▉ | 227/782 [02:06<05:02, 1.83it/s]
299
  29%|██▉ | 228/782 [02:07<04:53, 1.89it/s]
300
  29%|██▉ | 229/782 [02:07<04:54, 1.87it/s]
301
  29%|██▉ | 230/782 [02:08<05:09, 1.78it/s]
302
  30%|██▉ | 231/782 [02:08<04:57, 1.85it/s]
303
  30%|██▉ | 232/782 [02:09<04:58, 1.84it/s]
304
  30%|██▉ | 233/782 [02:09<05:01, 1.82it/s]
305
  30%|██▉ | 234/782 [02:10<04:59, 1.83it/s]
306
  30%|███ | 235/782 [02:10<04:55, 1.85it/s]
307
  30%|███ | 236/782 [02:11<04:54, 1.85it/s]
308
  30%|███ | 237/782 [02:11<04:55, 1.84it/s]
309
  30%|███ | 238/782 [02:12<04:45, 1.90it/s]
310
  31%|███ | 239/782 [02:12<04:47, 1.89it/s]
311
  31%|███ | 240/782 [02:13<04:52, 1.86it/s]
312
  31%|███ | 241/782 [02:14<04:54, 1.84it/s]
313
  31%|███ | 242/782 [02:14<04:39, 1.93it/s]
314
  31%|███ | 243/782 [02:15<04:43, 1.90it/s]
315
  31%|███ | 244/782 [02:15<05:08, 1.74it/s]
316
  31%|███▏ | 245/782 [02:16<04:53, 1.83it/s]
317
  31%|███▏ | 246/782 [02:16<04:51, 1.84it/s]
318
  32%|███▏ | 247/782 [02:17<04:48, 1.86it/s]
319
  32%|███▏ | 248/782 [02:17<04:54, 1.81it/s]
320
  32%|███▏ | 249/782 [02:18<04:53, 1.82it/s]
321
  32%|███▏ | 250/782 [02:18<04:40, 1.90it/s]
322
 
323
+
324
  32%|███▏ | 250/782 [02:19<04:40, 1.90it/s]
325
  32%|███▏ | 251/782 [02:19<04:45, 1.86it/s]
326
  32%|███▏ | 252/782 [02:20<04:51, 1.82it/s]
327
  32%|███▏ | 253/782 [02:20<04:42, 1.87it/s]
328
  32%|███▏ | 254/782 [02:21<04:40, 1.88it/s]
329
  33%|███▎ | 255/782 [02:21<04:39, 1.89it/s]
330
  33%|███▎ | 256/782 [02:22<04:37, 1.90it/s]
331
  33%|███▎ | 257/782 [02:22<04:34, 1.91it/s]
332
  33%|███▎ | 258/782 [02:23<04:36, 1.89it/s]
333
  33%|███▎ | 259/782 [02:23<04:45, 1.83it/s]
334
  33%|███▎ | 260/782 [02:24<04:37, 1.88it/s]
335
  33%|███▎ | 261/782 [02:24<04:31, 1.92it/s]
336
  34%|███▎ | 262/782 [02:25<04:36, 1.88it/s]
337
  34%|███▎ | 263/782 [02:25<04:38, 1.86it/s]
338
  34%|███▍ | 264/782 [02:26<04:37, 1.87it/s]
339
  34%|███▍ | 265/782 [02:26<04:40, 1.84it/s]
340
  34%|███▍ | 266/782 [02:27<04:33, 1.89it/s]
341
  34%|███▍ | 267/782 [02:28<04:37, 1.86it/s]
342
  34%|███▍ | 268/782 [02:28<04:43, 1.81it/s]
343
  34%|███▍ | 269/782 [02:29<04:47, 1.78it/s]
344
  35%|███▍ | 270/782 [02:29<04:36, 1.85it/s]
345
  35%|███▍ | 271/782 [02:30<04:40, 1.82it/s]
346
  35%|███▍ | 272/782 [02:30<04:49, 1.76it/s]
347
  35%|███▍ | 273/782 [02:31<04:37, 1.84it/s]
348
  35%|███▌ | 274/782 [02:31<04:35, 1.84it/s]
349
  35%|███▌ | 275/782 [02:32<04:41, 1.80it/s]
350
  35%|███▌ | 276/782 [02:32<04:30, 1.87it/s]
351
  35%|███▌ | 277/782 [02:33<04:35, 1.83it/s]
352
  36%|███▌ | 278/782 [02:34<04:34, 1.84it/s]
353
  36%|███▌ | 279/782 [02:34<04:33, 1.84it/s]
354
  36%|███▌ | 280/782 [02:35<04:33, 1.84it/s]
355
  36%|███▌ | 281/782 [02:35<04:36, 1.81it/s]
356
  36%|███▌ | 282/782 [02:36<04:26, 1.88it/s]
357
  36%|███▌ | 283/782 [02:36<04:29, 1.85it/s]
358
  36%|███▋ | 284/782 [02:37<04:38, 1.79it/s]
359
  36%|███▋ | 285/782 [02:37<04:29, 1.85it/s]
360
  37%|███▋ | 286/782 [02:38<04:30, 1.83it/s]
361
  37%|███▋ | 287/782 [02:38<04:28, 1.85it/s]
362
  37%|███▋ | 288/782 [02:39<04:22, 1.88it/s]
363
  37%|███▋ | 289/782 [02:40<04:24, 1.87it/s]
364
  37%|███▋ | 290/782 [02:40<04:41, 1.75it/s]
365
  37%|███▋ | 291/782 [02:41<04:33, 1.80it/s]
366
  37%|███▋ | 292/782 [02:41<04:29, 1.82it/s]
367
  37%|███▋ | 293/782 [02:42<04:37, 1.76it/s]
368
  38%|███▊ | 294/782 [02:42<04:24, 1.85it/s]
369
  38%|███▊ | 295/782 [02:43<04:26, 1.83it/s]
370
  38%|███▊ | 296/782 [02:43<04:32, 1.78it/s]
371
  38%|███▊ | 297/782 [02:44<04:26, 1.82it/s]
372
  38%|███▊ | 298/782 [02:44<04:17, 1.88it/s]
373
  38%|███▊ | 299/782 [02:45<04:18, 1.87it/s]
374
  38%|███▊ | 300/782 [02:46<04:16, 1.88it/s]
375
 
376
+
377
  38%|███▊ | 300/782 [02:46<04:16, 1.88it/s]
378
  38%|███▊ | 301/782 [02:46<04:18, 1.86it/s]
379
  39%|███▊ | 302/782 [02:47<04:18, 1.86it/s]
380
  39%|███▊ | 303/782 [02:47<04:20, 1.84it/s]
381
  39%|███▉ | 304/782 [02:48<04:19, 1.84it/s]
382
  39%|███▉ | 305/782 [02:48<04:13, 1.88it/s]
383
  39%|██���▉ | 306/782 [02:49<04:16, 1.86it/s]
384
  39%|███▉ | 307/782 [02:49<04:10, 1.89it/s]
385
  39%|███▉ | 308/782 [02:50<04:10, 1.89it/s]
386
  40%|███▉ | 309/782 [02:50<04:11, 1.88it/s]
387
  40%|███▉ | 310/782 [02:51<04:09, 1.89it/s]
388
  40%|███▉ | 311/782 [02:51<04:07, 1.90it/s]
389
  40%|███▉ | 312/782 [02:52<04:08, 1.89it/s]
390
  40%|████ | 313/782 [02:52<04:09, 1.88it/s]
391
  40%|████ | 314/782 [02:53<04:08, 1.88it/s]
392
  40%|████ | 315/782 [02:54<04:15, 1.83it/s]
393
  40%|████ | 316/782 [02:54<04:13, 1.84it/s]
394
  41%|████ | 317/782 [02:55<04:07, 1.88it/s]
395
  41%|████ | 318/782 [02:55<04:06, 1.88it/s]
396
  41%|████ | 319/782 [02:56<04:03, 1.90it/s]
397
  41%|████ | 320/782 [02:56<04:00, 1.92it/s]
398
  41%|████ | 321/782 [02:57<04:05, 1.87it/s]
399
  41%|████ | 322/782 [02:57<04:09, 1.84it/s]
400
  41%|████▏ | 323/782 [02:58<04:05, 1.87it/s]
401
  41%|████▏ | 324/782 [02:58<04:04, 1.88it/s]
402
  42%|████▏ | 325/782 [02:59<04:05, 1.86it/s]
403
  42%|████▏ | 326/782 [02:59<04:01, 1.89it/s]
404
  42%|████▏ | 327/782 [03:00<03:59, 1.90it/s]
405
  42%|████▏ | 328/782 [03:01<04:06, 1.84it/s]
406
  42%|████▏ | 329/782 [03:01<04:02, 1.86it/s]
407
  42%|████▏ | 330/782 [03:02<04:00, 1.88it/s]
408
  42%|████▏ | 331/782 [03:02<03:59, 1.88it/s]
409
  42%|████▏ | 332/782 [03:03<04:12, 1.78it/s]
410
  43%|████▎ | 333/782 [03:03<04:09, 1.80it/s]
411
  43%|████▎ | 334/782 [03:04<04:01, 1.86it/s]
412
  43%|████▎ | 335/782 [03:04<04:05, 1.82it/s]
413
  43%|████▎ | 336/782 [03:05<04:19, 1.72it/s]
414
  43%|████▎ | 337/782 [03:05<04:03, 1.83it/s]
415
  43%|████▎ | 338/782 [03:06<04:02, 1.83it/s]
416
  43%|████▎ | 339/782 [03:07<03:59, 1.85it/s]
417
  43%|████▎ | 340/782 [03:07<03:50, 1.91it/s]
418
  44%|████▎ | 341/782 [03:08<03:51, 1.90it/s]
419
  44%|████▎ | 342/782 [03:08<03:55, 1.87it/s]
420
  44%|████▍ | 343/782 [03:09<03:53, 1.88it/s]
421
  44%|████▍ | 344/782 [03:09<03:48, 1.91it/s]
422
  44%|████▍ | 345/782 [03:10<03:48, 1.92it/s]
423
  44%|████▍ | 346/782 [03:10<03:54, 1.86it/s]
424
  44%|████▍ | 347/782 [03:11<03:55, 1.85it/s]
425
  45%|████▍ | 348/782 [03:11<03:51, 1.88it/s]
426
  45%|████▍ | 349/782 [03:12<04:01, 1.79it/s]
427
  45%|████▍ | 350/782 [03:12<04:02, 1.78it/s]
428
 
429
+
430
  45%|████▍ | 350/782 [03:13<04:02, 1.78it/s]
431
  45%|████▍ | 351/782 [03:13<03:53, 1.84it/s]
432
  45%|████▌ | 352/782 [03:14<03:51, 1.86it/s]
433
  45%|████▌ | 353/782 [03:14<03:58, 1.80it/s]
434
  45%|████▌ | 354/782 [03:15<03:48, 1.88it/s]
435
  45%|████▌ | 355/782 [03:15<03:50, 1.86it/s]
436
  46%|████▌ | 356/782 [03:16<03:48, 1.86it/s]
437
  46%|████▌ | 357/782 [03:16<03:38, 1.95it/s]
438
  46%|████▌ | 358/782 [03:17<03:45, 1.88it/s]
439
  46%|████▌ | 359/782 [03:17<03:51, 1.83it/s]
440
  46%|████▌ | 360/782 [03:18<03:46, 1.86it/s]
441
  46%|████▌ | 361/782 [03:18<03:53, 1.81it/s]
442
  46%|████▋ | 362/782 [03:19<03:55, 1.78it/s]
443
  46%|████▋ | 363/782 [03:19<03:48, 1.84it/s]
444
  47%|████▋ | 364/782 [03:20<03:48, 1.83it/s]
445
  47%|████▋ | 365/782 [03:21<03:49, 1.82it/s]
446
  47%|████▋ | 366/782 [03:21<03:40, 1.89it/s]
447
  47%|████▋ | 367/782 [03:22<03:36, 1.92it/s]
448
  47%|████▋ | 368/782 [03:22<03:40, 1.88it/s]
449
  47%|████▋ | 369/782 [03:23<03:34, 1.92it/s]
450
  47%|████▋ | 370/782 [03:23<03:33, 1.93it/s]
451
  47%|████▋ | 371/782 [03:24<03:34, 1.92it/s]
452
  48%|████▊ | 372/782 [03:24<03:40, 1.86it/s]
453
  48%|████▊ | 373/782 [03:25<03:38, 1.87it/s]
454
  48%|████▊ | 374/782 [03:25<03:35, 1.89it/s]
455
  48%|████▊ | 375/782 [03:26<03:37, 1.87it/s]
456
  48%|████▊ | 376/782 [03:26<03:35, 1.88it/s]
457
  48%|████▊ | 377/782 [03:27<03:34, 1.89it/s]
458
  48%|████▊ | 378/782 [03:27<03:35, 1.88it/s]
459
  48%|████▊ | 379/782 [03:28<03:31, 1.91it/s]
460
  49%|████▊ | 380/782 [03:28<03:29, 1.91it/s]
461
  49%|████▊ | 381/782 [03:29<03:36, 1.85it/s]
462
  49%|████▉ | 382/782 [03:30<03:49, 1.74it/s]
463
  49%|████▉ | 383/782 [03:30<03:38, 1.83it/s]
464
  49%|████▉ | 384/782 [03:31<03:41, 1.79it/s]
465
  49%|████▉ | 385/782 [03:31<03:44, 1.77it/s]
466
  49%|████▉ | 386/782 [03:32<03:45, 1.76it/s]
467
  49%|████▉ | 387/782 [03:32<03:39, 1.80it/s]
468
  50%|████▉ | 388/782 [03:33<03:33, 1.84it/s]
469
  50%|████▉ | 389/782 [03:33<03:33, 1.84it/s]
470
  50%|████▉ | 390/782 [03:34<03:38, 1.79it/s]
471
  50%|█████ | 391/782 [03:35<03:28, 1.87it/s]
472
  50%|█████ | 392/782 [03:35<03:35, 1.81it/s]
473
  50%|█████ | 393/782 [03:36<03:48, 1.70it/s]
474
  50%|█████ | 394/782 [03:36<03:35, 1.80it/s]
475
  51%|█████ | 395/782 [03:37<03:34, 1.81it/s]
476
  51%|█████ | 396/782 [03:37<03:34, 1.80it/s]
477
  51%|█████ | 397/782 [03:38<03:31, 1.82it/s]
478
  51%|█████ | 398/782 [03:38<03:28, 1.84it/s]
479
  51%|█████ | 399/782 [03:39<03:31, 1.81it/s]
480
  51%|█████ | 400/782 [03:40<03:24, 1.87it/s]
481
 
482
+
483
  51%|█████ | 400/782 [03:40<03:24, 1.87it/s]
484
  51%|█████▏ | 401/782 [03:40<03:27, 1.84it/s]
485
  51%|█████▏ | 402/782 [03:41<03:33, 1.78it/s]
486
  52%|█████▏ | 403/782 [03:41<03:23, 1.86it/s]
487
  52%|█████▏ | 404/782 [03:42<03:23, 1.86it/s]
488
  52%|█████▏ | 405/782 [03:42<03:30, 1.79it/s]
489
  52%|█████▏ | 406/782 [03:43<03:20, 1.87it/s]
490
  52%|█████▏ | 407/782 [03:43<03:19, 1.88it/s]
491
  52%|█████▏ | 408/782 [03:44<03:23, 1.83it/s]
492
  52%|█████▏ | 409/782 [03:44<03:17, 1.89it/s]
493
  52%|█████▏ | 410/782 [03:45<03:16, 1.89it/s]
494
  53%|█████▎ | 411/782 [03:46<03:20, 1.85it/s]
495
  53%|█████▎ | 412/782 [03:46<03:22, 1.83it/s]
496
  53%|█████▎ | 413/782 [03:47<03:17, 1.87it/s]
497
  53%|█████▎ | 414/782 [03:47<03:14, 1.89it/s]
498
  53%|█████▎ | 415/782 [03:48<03:17, 1.86it/s]
499
  53%|█████▎ | 416/782 [03:48<03:18, 1.84it/s]
500
  53%|█████▎ | 417/782 [03:49<03:14, 1.88it/s]
501
  53%|█████▎ | 418/782 [03:49<03:21, 1.80it/s]
502
  54%|█████▎ | 419/782 [03:50<03:26, 1.76it/s]
503
  54%|█████▎ | 420/782 [03:50<03:18, 1.82it/s]
504
  54%|█████▍ | 421/782 [03:51<03:16, 1.84it/s]
505
  54%|█████▍ | 422/782 [03:51<03:13, 1.86it/s]
506
  54%|█████▍ | 423/782 [03:52<03:20, 1.79it/s]
507
  54%|█████▍ | 424/782 [03:53<03:14, 1.84it/s]
508
  54%|█████▍ | 425/782 [03:53<03:10, 1.88it/s]
509
  54%|█████▍ | 426/782 [03:54<03:13, 1.84it/s]
510
  55%|█████▍ | 427/782 [03:54<03:08, 1.88it/s]
511
  55%|█████▍ | 428/782 [03:55<03:08, 1.88it/s]
512
  55%|█████▍ | 429/782 [03:55<03:06, 1.89it/s]
513
  55%|█████▍ | 430/782 [03:56<03:08, 1.87it/s]
514
  55%|█████▌ | 431/782 [03:56<03:03, 1.91it/s]
515
  55%|█████▌ | 432/782 [03:57<03:07, 1.87it/s]
516
  55%|█████▌ | 433/782 [03:57<03:11, 1.82it/s]
517
  55%|█████▌ | 434/782 [03:58<03:05, 1.88it/s]
518
  56%|█████▌ | 435/782 [03:58<03:06, 1.86it/s]
519
  56%|█████▌ | 436/782 [03:59<03:14, 1.78it/s]
520
  56%|█████▌ | 437/782 [04:00<03:06, 1.85it/s]
521
  56%|█████▌ | 438/782 [04:00<03:04, 1.86it/s]
522
  56%|█████▌ | 439/782 [04:01<03:04, 1.86it/s]
523
  56%|█████▋ | 440/782 [04:01<03:00, 1.90it/s]
524
  56%|█████▋ | 441/782 [04:02<02:59, 1.90it/s]
525
  57%|█████▋ | 442/782 [04:02<03:02, 1.86it/s]
526
  57%|█████▋ | 443/782 [04:03<02:58, 1.90it/s]
527
  57%|█████▋ | 444/782 [04:03<02:59, 1.89it/s]
528
  57%|█████▋ | 445/782 [04:04<03:03, 1.83it/s]
529
  57%|█████▋ | 446/782 [04:04<02:53, 1.94it/s]
530
  57%|█████▋ | 447/782 [04:05<02:56, 1.90it/s]
531
  57%|█████▋ | 448/782 [04:05<03:00, 1.85it/s]
532
  57%|█████▋ | 449/782 [04:06<03:00, 1.85it/s]
533
  58%|█████▊ | 450/782 [04:06<02:56, 1.88it/s]
534
 
535
+
536
  58%|█████▊ | 450/782 [04:07<02:56, 1.88it/s]
537
  58%|█████▊ | 451/782 [04:07<02:53, 1.90it/s]
538
  58%|█████▊ | 452/782 [04:08<02:55, 1.88it/s]
539
  58%|█████▊ | 453/782 [04:08<02:49, 1.94it/s]
540
  58%|█████▊ | 454/782 [04:09<02:47, 1.96it/s]
541
  58%|█████▊ | 455/782 [04:09<02:48, 1.94it/s]
542
  58%|█████▊ | 456/782 [04:10<02:47, 1.95it/s]
543
  58%|█████▊ | 457/782 [04:10<02:46, 1.95it/s]
544
  59%|█████▊ | 458/782 [04:11<02:52, 1.88it/s]
545
  59%|█████▊ | 459/782 [04:11<02:56, 1.83it/s]
546
  59%|█████▉ | 460/782 [04:12<02:51, 1.88it/s]
547
  59%|█████▉ | 461/782 [04:12<02:52, 1.86it/s]
548
  59%|█████▉ | 462/782 [04:13<02:53, 1.85it/s]
549
  59%|█████▉ | 463/782 [04:13<02:51, 1.86it/s]
550
  59%|█████▉ | 464/782 [04:14<02:51, 1.85it/s]
551
  59%|█████▉ | 465/782 [04:14<02:47, 1.90it/s]
552
  60%|█████▉ | 466/782 [04:15<02:43, 1.94it/s]
553
  60%|█████▉ | 467/782 [04:15<02:43, 1.93it/s]
554
  60%|█████▉ | 468/782 [04:16<02:49, 1.85it/s]
555
  60%|█████▉ | 469/782 [04:16<02:40, 1.95it/s]
556
  60%|██████ | 470/782 [04:17<02:43, 1.91it/s]
557
  60%|██████ | 471/782 [04:18<02:45, 1.88it/s]
558
  60%|██████ | 472/782 [04:18<02:41, 1.92it/s]
559
  60%|██████ | 473/782 [04:19<02:42, 1.90it/s]
560
  61%|██████ | 474/782 [04:19<02:45, 1.86it/s]
561
  61%|██████ | 475/782 [04:20<02:39, 1.92it/s]
562
  61%|██████ | 476/782 [04:20<02:40, 1.91it/s]
563
  61%|██████ | 477/782 [04:21<02:40, 1.90it/s]
564
  61%|██████ | 478/782 [04:21<02:44, 1.85it/s]
565
  61%|██████▏ | 479/782 [04:22<02:41, 1.87it/s]
566
  61%|██████▏ | 480/782 [04:22<02:37, 1.91it/s]
567
  62%|██████▏ | 481/782 [04:23<02:41, 1.86it/s]
568
  62%|██████▏ | 482/782 [04:23<02:40, 1.87it/s]
569
  62%|██████▏ | 483/782 [04:24<02:37, 1.90it/s]
570
  62%|██████▏ | 484/782 [04:24<02:39, 1.87it/s]
571
  62%|██████▏ | 485/782 [04:25<02:42, 1.83it/s]
572
  62%|██████▏ | 486/782 [04:25<02:34, 1.92it/s]
573
  62%|██████▏ | 487/782 [04:26<02:35, 1.90it/s]
574
  62%|██████▏ | 488/782 [04:27<02:47, 1.76it/s]
575
  63%|██████▎ | 489/782 [04:27<02:38, 1.85it/s]
576
  63%|██████▎ | 490/782 [04:28<02:34, 1.89it/s]
577
  63%|██████▎ | 491/782 [04:28<02:33, 1.90it/s]
578
  63%|██████▎ | 492/782 [04:29<02:34, 1.88it/s]
579
  63%|██████▎ | 493/782 [04:29<02:30, 1.91it/s]
580
  63%|██████▎ | 494/782 [04:30<02:30, 1.91it/s]
581
  63%|██████▎ | 495/782 [04:30<02:30, 1.90it/s]
582
  63%|██████▎ | 496/782 [04:31<02:30, 1.90it/s]
583
  64%|██████▎ | 497/782 [04:31<02:28, 1.93it/s]
584
  64%|██████▎ | 498/782 [04:32<02:33, 1.85it/s]
585
  64%|██████▍ | 499/782 [04:32<02:33, 1.84it/s]
586
  64%|██████▍ | 500/782 [04:33<02:27, 1.91it/s]
587
 
588
+
589
  64%|██████▍ | 500/782 [04:33<02:27, 1.91it/s]
590
  64%|██████▍ | 501/782 [04:33<02:29, 1.88it/s]
591
  64%|██████▍ | 502/782 [04:34<02:29, 1.88it/s]
592
  64%|██████▍ | 503/782 [04:34<02:24, 1.93it/s]
593
  64%|██████▍ | 504/782 [04:35<02:27, 1.88it/s]
594
  65%|██████▍ | 505/782 [04:36<02:26, 1.89it/s]
595
  65%|██████▍ | 506/782 [04:36<02:23, 1.92it/s]
596
  65%|██████▍ | 507/782 [04:37<02:25, 1.88it/s]
597
  65%|██████▍ | 508/782 [04:37<02:26, 1.87it/s]
598
  65%|██████▌ | 509/782 [04:38<02:21, 1.93it/s]
599
  65%|██████▌ | 510/782 [04:38<02:22, 1.91it/s]
600
  65%|██████▌ | 511/782 [04:39<02:23, 1.89it/s]
601
  65%|██████▌ | 512/782 [04:39<02:27, 1.83it/s]
602
  66%|██████▌ | 513/782 [04:40<02:25, 1.85it/s]
603
  66%|██████▌ | 514/782 [04:40<02:21, 1.90it/s]
604
  66%|██████▌ | 515/782 [04:41<02:23, 1.86it/s]
605
  66%|██████▌ | 516/782 [04:41<02:27, 1.80it/s]
606
  66%|██████▌ | 517/782 [04:42<02:20, 1.88it/s]
607
  66%|██████▌ | 518/782 [04:43<02:21, 1.86it/s]
608
  66%|██████▋ | 519/782 [04:43<02:27, 1.78it/s]
609
  66%|██████▋ | 520/782 [04:44<02:20, 1.87it/s]
610
  67%|██████▋ | 521/782 [04:44<02:20, 1.86it/s]
611
  67%|██████▋ | 522/782 [04:45<02:21, 1.84it/s]
612
  67%|██████▋ | 523/782 [04:45<02:15, 1.91it/s]
613
  67%|██████▋ | 524/782 [04:46<02:15, 1.90it/s]
614
  67%|██████▋ | 525/782 [04:46<02:17, 1.86it/s]
615
  67%|██████▋ | 526/782 [04:47<02:11, 1.94it/s]
616
  67%|██████▋ | 527/782 [04:47<02:12, 1.92it/s]
617
  68%|██████▊ | 528/782 [04:48<02:16, 1.86it/s]
618
  68%|██████▊ | 529/782 [04:48<02:10, 1.94it/s]
619
  68%|██████▊ | 530/782 [04:49<02:09, 1.95it/s]
620
  68%|██████▊ | 531/782 [04:49<02:18, 1.81it/s]
621
  68%|██████▊ | 532/782 [04:50<02:18, 1.80it/s]
622
  68%|██████▊ | 533/782 [04:51<02:13, 1.86it/s]
623
  68%|██████▊ | 534/782 [04:51<02:11, 1.89it/s]
624
  68%|██████▊ | 535/782 [04:52<02:12, 1.87it/s]
625
  69%|██████▊ | 536/782 [04:52<02:15, 1.81it/s]
626
  69%|██████▊ | 537/782 [04:53<02:09, 1.89it/s]
627
  69%|██████▉ | 538/782 [04:53<02:08, 1.89it/s]
628
  69%|██████▉ | 539/782 [04:54<02:12, 1.84it/s]
629
  69%|██████▉ | 540/782 [04:54<02:08, 1.88it/s]
630
  69%|██████▉ | 541/782 [04:55<02:06, 1.91it/s]
631
  69%|██████▉ | 542/782 [04:55<02:07, 1.89it/s]
632
  69%|██████▉ | 543/782 [04:56<02:04, 1.92it/s]
633
  70%|██████▉ | 544/782 [04:56<02:02, 1.94it/s]
634
  70%|██████▉ | 545/782 [04:57<02:03, 1.92it/s]
635
  70%|██████▉ | 546/782 [04:57<02:05, 1.89it/s]
636
  70%|██████▉ | 547/782 [04:58<02:04, 1.88it/s]
637
  70%|███████ | 548/782 [04:58<02:04, 1.89it/s]
638
  70%|███████ | 549/782 [04:59<02:03, 1.88it/s]
639
  70%|███████ | 550/782 [05:00<02:02, 1.89it/s]
640
 
641
+
642
  70%|███████ | 550/782 [05:00<02:02, 1.89it/s]
643
  70%|███████ | 551/782 [05:00<02:03, 1.87it/s]
644
  71%|███████ | 552/782 [05:01<02:03, 1.86it/s]
645
  71%|███████ | 553/782 [05:01<02:03, 1.85it/s]
646
  71%|███████ | 554/782 [05:02<02:02, 1.86it/s]
647
  71%|███████ | 555/782 [05:02<02:01, 1.87it/s]
648
  71%|███████ | 556/782 [05:03<02:02, 1.85it/s]
649
  71%|███████ | 557/782 [05:03<02:08, 1.75it/s]
650
  71%|███████▏ | 558/782 [05:04<02:09, 1.73it/s]
651
  71%|███████▏ | 559/782 [05:05<02:08, 1.74it/s]
652
  72%|███████▏ | 560/782 [05:05<02:04, 1.79it/s]
653
  72%|███████▏ | 561/782 [05:06<02:09, 1.71it/s]
654
  72%|███████▏ | 562/782 [05:06<02:13, 1.65it/s]
655
  72%|███████▏ | 563/782 [05:07<02:19, 1.57it/s]
656
  72%|███████▏ | 564/782 [05:08<02:16, 1.59it/s]
657
  72%|███████▏ | 565/782 [05:08<02:17, 1.58it/s]
658
  72%|███████▏ | 566/782 [05:09<02:19, 1.55it/s]
659
  73%|███████▎ | 567/782 [05:10<02:18, 1.55it/s]
660
  73%|███████▎ | 568/782 [05:10<02:15, 1.58it/s]
661
  73%|███████▎ | 569/782 [05:11<02:20, 1.51it/s]
662
  73%|███████▎ | 570/782 [05:12<02:16, 1.55it/s]
663
  73%|███████▎ | 571/782 [05:12<02:16, 1.54it/s]
664
  73%|███████▎ | 572/782 [05:13<02:16, 1.54it/s]
665
  73%|███████▎ | 573/782 [05:14<02:19, 1.50it/s]
666
  73%|███████▎ | 574/782 [05:14<02:16, 1.53it/s]
667
  74%|███████▎ | 575/782 [05:15<02:15, 1.52it/s]
668
  74%|███████▎ | 576/782 [05:16<02:16, 1.50it/s]
669
  74%|███████▍ | 577/782 [05:16<02:15, 1.52it/s]
670
  74%|███████▍ | 578/782 [05:17<02:18, 1.47it/s]
671
  74%|███████▍ | 579/782 [05:18<02:12, 1.53it/s]
672
  74%|███████▍ | 580/782 [05:18<02:12, 1.53it/s]
673
  74%|███████▍ | 581/782 [05:19<02:15, 1.48it/s]
674
  74%|███████▍ | 582/782 [05:20<02:10, 1.53it/s]
675
  75%|███████▍ | 583/782 [05:20<02:11, 1.51it/s]
676
  75%|███████▍ | 584/782 [05:21<02:10, 1.51it/s]
677
  75%|███████▍ | 585/782 [05:22<02:07, 1.55it/s]
678
  75%|███████▍ | 586/782 [05:22<02:08, 1.53it/s]
679
  75%|███████▌ | 587/782 [05:23<02:11, 1.49it/s]
680
  75%|███████▌ | 588/782 [05:24<02:07, 1.52it/s]
681
  75%|███████▌ | 589/782 [05:24<02:09, 1.49it/s]
682
  75%|███████▌ | 590/782 [05:25<02:09, 1.49it/s]
683
  76%|███████▌ | 591/782 [05:26<02:05, 1.52it/s]
684
  76%|███████▌ | 592/782 [05:26<02:03, 1.54it/s]
685
  76%|███████▌ | 593/782 [05:27<02:01, 1.55it/s]
686
  76%|███████▌ | 594/782 [05:27<02:02, 1.53it/s]
687
  76%|███████▌ | 595/782 [05:28<02:01, 1.54it/s]
688
  76%|███████▌ | 596/782 [05:29<02:00, 1.54it/s]
689
  76%|███████▋ | 597/782 [05:29<02:01, 1.52it/s]
690
  76%|███████▋ | 598/782 [05:30<02:00, 1.53it/s]
691
  77%|███████▋ | 599/782 [05:31<01:56, 1.57it/s]
692
  77%|███████▋ | 600/782 [05:31<01:57, 1.54it/s]
693
 
694
+
695
  77%|███████▋ | 600/782 [05:31<01:57, 1.54it/s]
696
  77%|███████▋ | 601/782 [05:32<01:59, 1.52it/s]
697
  77%|███████▋ | 602/782 [05:33<01:56, 1.55it/s]
698
  77%|███████▋ | 603/782 [05:33<01:58, 1.51it/s]
699
  77%|███████▋ | 604/782 [05:34<02:01, 1.47it/s]
700
  77%|███████▋ | 605/782 [05:35<01:58, 1.49it/s]
701
  77%|███████▋ | 606/782 [05:35<01:55, 1.52it/s]
702
  78%|███████▊ | 607/782 [05:36<01:55, 1.51it/s]
703
  78%|███████▊ | 608/782 [05:37<01:50, 1.57it/s]
704
  78%|███████▊ | 609/782 [05:37<01:52, 1.54it/s]
705
  78%|███████▊ | 610/782 [05:38<01:57, 1.46it/s]
706
  78%|███████▊ | 611/782 [05:39<01:53, 1.51it/s]
707
  78%|███████▊ | 612/782 [05:39<01:55, 1.48it/s]
708
  78%|███████▊ | 613/782 [05:40<01:51, 1.52it/s]
709
  79%|███████▊ | 614/782 [05:41<01:48, 1.54it/s]
710
  79%|███████▊ | 615/782 [05:41<01:48, 1.54it/s]
711
  79%|███████▉ | 616/782 [05:42<01:51, 1.49it/s]
712
  79%|███████▉ | 617/782 [05:43<01:48, 1.53it/s]
713
  79%|███████▉ | 618/782 [05:43<01:50, 1.48it/s]
714
  79%|███████▉ | 619/782 [05:44<01:50, 1.48it/s]
715
  79%|███████▉ | 620/782 [05:45<01:48, 1.49it/s]
716
  79%|███████▉ | 621/782 [05:45<01:48, 1.48it/s]
717
  80%|███████▉ | 622/782 [05:46<01:47, 1.49it/s]
718
  80%|███████▉ | 623/782 [05:47<01:43, 1.54it/s]
719
  80%|███████▉ | 624/782 [05:47<01:42, 1.53it/s]
720
  80%|███████▉ | 625/782 [05:48<01:42, 1.53it/s]
721
  80%|████████ | 626/782 [05:49<01:42, 1.52it/s]
722
  80%|████████ | 627/782 [05:49<01:43, 1.50it/s]
723
  80%|████████ | 628/782 [05:50<01:42, 1.51it/s]
724
  80%|████████ | 629/782 [05:51<01:38, 1.56it/s]
725
  81%|████████ | 630/782 [05:51<01:43, 1.46it/s]
726
  81%|████████ | 631/782 [05:52<01:41, 1.48it/s]
727
  81%|████████ | 632/782 [05:52<01:33, 1.61it/s]
728
  81%|████████ | 633/782 [05:53<01:28, 1.69it/s]
729
  81%|████████ | 634/782 [05:54<01:27, 1.69it/s]
730
  81%|████████ | 635/782 [05:54<01:22, 1.78it/s]
731
  81%|████████▏ | 636/782 [05:55<01:22, 1.77it/s]
732
  81%|████████▏ | 637/782 [05:55<01:23, 1.73it/s]
733
  82%|████████▏ | 638/782 [05:56<01:21, 1.77it/s]
734
  82%|████████▏ | 639/782 [05:56<01:18, 1.82it/s]
735
  82%|████████▏ | 640/782 [05:57<01:18, 1.81it/s]
736
  82%|████████▏ | 641/782 [05:57<01:17, 1.83it/s]
737
  82%|████████▏ | 642/782 [05:58<01:14, 1.87it/s]
738
  82%|████████▏ | 643/782 [05:58<01:15, 1.85it/s]
739
  82%|████████▏ | 644/782 [05:59<01:14, 1.86it/s]
740
  82%|████████▏ | 645/782 [06:00<01:13, 1.85it/s]
741
  83%|████████▎ | 646/782 [06:00<01:13, 1.85it/s]
742
  83%|████████▎ | 647/782 [06:01<01:14, 1.82it/s]
743
  83%|████████▎ | 648/782 [06:01<01:11, 1.86it/s]
744
  83%|████████▎ | 649/782 [06:02<01:10, 1.88it/s]
745
  83%|████████▎ | 650/782 [06:02<01:11, 1.85it/s]
746
 
747
+
748
  83%|████████▎ | 650/782 [06:02<01:11, 1.85it/s]
749
  83%|████████▎ | 651/782 [06:03<01:10, 1.87it/s]
750
  83%|████████▎ | 652/782 [06:03<01:08, 1.89it/s]
751
  84%|████████▎ | 653/782 [06:04<01:11, 1.81it/s]
752
  84%|████████▎ | 654/782 [06:04<01:10, 1.83it/s]
753
  84%|████████▍ | 655/782 [06:05<01:07, 1.88it/s]
754
  84%|████████▍ | 656/782 [06:05<01:09, 1.83it/s]
755
  84%|████████▍ | 657/782 [06:06<01:08, 1.81it/s]
756
  84%|████████▍ | 658/782 [06:07<01:06, 1.88it/s]
757
  84%|████████▍ | 659/782 [06:07<01:06, 1.85it/s]
758
  84%|████████▍ | 660/782 [06:08<01:08, 1.79it/s]
759
  85%|████████▍ | 661/782 [06:08<01:04, 1.87it/s]
760
  85%|████████▍ | 662/782 [06:09<01:04, 1.86it/s]
761
  85%|████████▍ | 663/782 [06:09<01:05, 1.81it/s]
762
  85%|████████▍ | 664/782 [06:10<01:03, 1.86it/s]
763
  85%|████████▌ | 665/782 [06:10<01:03, 1.86it/s]
764
  85%|████████▌ | 666/782 [06:11<01:05, 1.78it/s]
765
  85%|████████▌ | 667/782 [06:11<01:01, 1.88it/s]
766
  85%|████████▌ | 668/782 [06:12<01:00, 1.88it/s]
767
  86%|████████▌ | 669/782 [06:12<01:00, 1.87it/s]
768
  86%|████████▌ | 670/782 [06:13<00:59, 1.88it/s]
769
  86%|████████▌ | 671/782 [06:14<00:58, 1.90it/s]
770
  86%|████████▌ | 672/782 [06:14<00:57, 1.92it/s]
771
  86%|████████▌ | 673/782 [06:15<00:58, 1.88it/s]
772
  86%|████████▌ | 674/782 [06:15<00:56, 1.90it/s]
773
  86%|████████▋ | 675/782 [06:16<00:55, 1.92it/s]
774
  86%|████████▋ | 676/782 [06:16<00:58, 1.82it/s]
775
  87%|████████▋ | 677/782 [06:17<00:58, 1.79it/s]
776
  87%|████████▋ | 678/782 [06:17<00:55, 1.88it/s]
777
  87%|████████▋ | 679/782 [06:18<00:55, 1.86it/s]
778
  87%|████████▋ | 680/782 [06:18<00:57, 1.77it/s]
779
  87%|████████▋ | 681/782 [06:19<00:53, 1.88it/s]
780
  87%|████████▋ | 682/782 [06:19<00:54, 1.84it/s]
781
  87%|████████▋ | 683/782 [06:20<00:54, 1.81it/s]
782
  87%|████████▋ | 684/782 [06:21<00:51, 1.90it/s]
783
  88%|████████▊ | 685/782 [06:21<00:52, 1.85it/s]
784
  88%|████████▊ | 686/782 [06:22<00:52, 1.83it/s]
785
  88%|████████▊ | 687/782 [06:22<00:50, 1.89it/s]
786
  88%|████████▊ | 688/782 [06:23<00:49, 1.88it/s]
787
  88%|████████▊ | 689/782 [06:23<00:49, 1.89it/s]
788
  88%|████████▊ | 690/782 [06:24<00:49, 1.87it/s]
789
  88%|████████▊ | 691/782 [06:24<00:48, 1.89it/s]
790
  88%|████████▊ | 692/782 [06:25<00:47, 1.90it/s]
791
  89%|████████▊ | 693/782 [06:25<00:46, 1.90it/s]
792
  89%|████████▊ | 694/782 [06:26<00:46, 1.90it/s]
793
  89%|████████▉ | 695/782 [06:26<00:47, 1.84it/s]
794
  89%|████████▉ | 696/782 [06:27<00:45, 1.89it/s]
795
  89%|████████▉ | 697/782 [06:27<00:45, 1.87it/s]
796
  89%|████████▉ | 698/782 [06:28<00:44, 1.88it/s]
797
  89%|████████▉ | 699/782 [06:29<00:44, 1.85it/s]
798
  90%|████████▉ | 700/782 [06:29<00:43, 1.88it/s]
799
 
800
+
801
  90%|████████▉ | 700/782 [06:29<00:43, 1.88it/s]
802
  90%|████████▉ | 701/782 [06:30<00:43, 1.87it/s]
803
  90%|████████▉ | 702/782 [06:30<00:44, 1.80it/s]
804
  90%|████████▉ | 703/782 [06:31<00:44, 1.79it/s]
805
  90%|█████████ | 704/782 [06:31<00:41, 1.86it/s]
806
  90%|█████████ | 705/782 [06:32<00:41, 1.84it/s]
807
  90%|█████████ | 706/782 [06:32<00:40, 1.87it/s]
808
  90%|█████████ | 707/782 [06:33<00:39, 1.89it/s]
809
  91%|█████████ | 708/782 [06:33<00:39, 1.89it/s]
810
  91%|█████████ | 709/782 [06:34<00:38, 1.89it/s]
811
  91%|█████████ | 710/782 [06:34<00:39, 1.83it/s]
812
  91%|█████████ | 711/782 [06:35<00:38, 1.86it/s]
813
  91%|█████████ | 712/782 [06:36<00:37, 1.88it/s]
814
  91%|█████████ | 713/782 [06:36<00:37, 1.84it/s]
815
  91%|█████████▏| 714/782 [06:37<00:37, 1.82it/s]
816
  91%|█████████▏| 715/782 [06:37<00:35, 1.87it/s]
817
  92%|█████████▏| 716/782 [06:38<00:35, 1.86it/s]
818
  92%|█████████▏| 717/782 [06:38<00:35, 1.84it/s]
819
  92%|█████████▏| 718/782 [06:39<00:34, 1.87it/s]
820
  92%|█████████▏| 719/782 [06:39<00:33, 1.86it/s]
821
  92%|█████████▏| 720/782 [06:40<00:33, 1.87it/s]
822
  92%|█████████▏| 721/782 [06:40<00:32, 1.87it/s]
823
  92%|█████████▏| 722/782 [06:41<00:31, 1.91it/s]
824
  92%|█████████▏| 723/782 [06:41<00:30, 1.91it/s]
825
  93%|█████████▎| 724/782 [06:42<00:31, 1.84it/s]
826
  93%|█████████▎| 725/782 [06:43<00:31, 1.82it/s]
827
  93%|█████████▎| 726/782 [06:43<00:31, 1.77it/s]
828
  93%|█████████▎| 727/782 [06:44<00:30, 1.80it/s]
829
  93%|█████████▎| 728/782 [06:44<00:29, 1.81it/s]
830
  93%|█████████▎| 729/782 [06:45<00:29, 1.82it/s]
831
  93%|█████████▎| 730/782 [06:45<00:28, 1.85it/s]
832
  93%|█████████▎| 731/782 [06:46<00:27, 1.86it/s]
833
  94%|█████████▎| 732/782 [06:46<00:27, 1.85it/s]
834
  94%|█████████▎| 733/782 [06:47<00:26, 1.88it/s]
835
  94%|█████████▍| 734/782 [06:47<00:25, 1.86it/s]
836
  94%|█████████▍| 735/782 [06:48<00:25, 1.85it/s]
837
  94%|█████████▍| 736/782 [06:49<00:24, 1.88it/s]
838
  94%|█████████▍| 737/782 [06:49<00:23, 1.89it/s]
839
  94%|█████████▍| 738/782 [06:50<00:23, 1.88it/s]
840
  95%|█████████▍| 739/782 [06:50<00:22, 1.90it/s]
841
  95%|█████████▍| 740/782 [06:51<00:22, 1.90it/s]
842
  95%|█████████▍| 741/782 [06:51<00:22, 1.85it/s]
843
  95%|█████████▍| 742/782 [06:52<00:21, 1.89it/s]
844
  95%|█████████▌| 743/782 [06:52<00:20, 1.91it/s]
845
  95%|█████████▌| 744/782 [06:53<00:20, 1.84it/s]
846
  95%|█████████▌| 745/782 [06:53<00:19, 1.88it/s]
847
  95%|█████████▌| 746/782 [06:54<00:19, 1.88it/s]
848
  96%|█████████▌| 747/782 [06:54<00:19, 1.83it/s]
849
  96%|█████████▌| 748/782 [06:55<00:18, 1.82it/s]
850
  96%|█████████▌| 749/782 [06:55<00:17, 1.86it/s]
851
  96%|█████████▌| 750/782 [06:56<00:17, 1.81it/s]
852
 
853
+
854
  96%|█████████▌| 750/782 [06:56<00:17, 1.81it/s]
855
  96%|█████████▌| 751/782 [06:57<00:17, 1.73it/s]
856
  96%|█████████▌| 752/782 [06:57<00:16, 1.82it/s]
857
  96%|█████████▋| 753/782 [06:58<00:15, 1.83it/s]
858
  96%|█████████▋| 754/782 [06:58<00:15, 1.80it/s]
859
  97%|█████████▋| 755/782 [06:59<00:14, 1.82it/s]
860
  97%|█████████▋| 756/782 [06:59<00:14, 1.83it/s]
861
  97%|█████████▋| 757/782 [07:00<00:13, 1.82it/s]
862
  97%|█████████▋| 758/782 [07:00<00:13, 1.80it/s]
863
  97%|█████████▋| 759/782 [07:01<00:12, 1.83it/s]
864
  97%|█████████▋| 760/782 [07:02<00:11, 1.89it/s]
865
  97%|█████████▋| 761/782 [07:02<00:11, 1.90it/s]
866
  97%|█████████▋| 762/782 [07:03<00:10, 1.90it/s]
867
  98%|█████████▊| 763/782 [07:03<00:09, 1.91it/s]
868
  98%|█████████▊| 764/782 [07:04<00:09, 1.89it/s]
869
  98%|█████████▊| 765/782 [07:04<00:09, 1.88it/s]
870
  98%|█████████▊| 766/782 [07:05<00:08, 1.86it/s]
871
  98%|█████████▊| 767/782 [07:05<00:08, 1.85it/s]
872
  98%|█████████▊| 768/782 [07:06<00:07, 1.87it/s]
873
  98%|█████████▊| 769/782 [07:06<00:06, 1.87it/s]
874
  98%|█████████▊| 770/782 [07:07<00:06, 1.86it/s]
875
  99%|█████████▊| 771/782 [07:07<00:05, 1.90it/s]
876
  99%|█████████▊| 772/782 [07:08<00:05, 1.92it/s]
877
  99%|█████████▉| 773/782 [07:08<00:04, 1.85it/s]
878
  99%|█████████▉| 774/782 [07:09<00:04, 1.85it/s]
879
  99%|█████████▉| 775/782 [07:09<00:03, 1.91it/s]
880
  99%|█████████▉| 776/782 [07:10<00:03, 1.90it/s]
881
  99%|█████████▉| 777/782 [07:11<00:02, 1.90it/s]
882
  99%|█████████▉| 778/782 [07:11<00:02, 1.92it/s]
883
 
884
+
885
+
886
+
887
+
888
+
889
+
890
+
891
+
892
+
893
+
894
+
895
+
896
+
README.md ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: transformers
3
+ license: apache-2.0
4
+ base_model: google/t5-v1_1-large
5
+ tags:
6
+ - generated_from_trainer
7
+ model-index:
8
+ - name: google_t5-v1_1-large_ds100_upsample1000
9
+ results: []
10
+ ---
11
+
12
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
13
+ should probably proofread and complete it, then remove this comment. -->
14
+
15
+ # google_t5-v1_1-large_ds100_upsample1000
16
+
17
+ This model is a fine-tuned version of [google/t5-v1_1-large](https://huggingface.co/google/t5-v1_1-large) on an unknown dataset.
18
+
19
+ ## Model description
20
+
21
+ More information needed
22
+
23
+ ## Intended uses & limitations
24
+
25
+ More information needed
26
+
27
+ ## Training and evaluation data
28
+
29
+ More information needed
30
+
31
+ ## Training procedure
32
+
33
+ ### Training hyperparameters
34
+
35
+ The following hyperparameters were used during training:
36
+ - learning_rate: 0.0001
37
+ - train_batch_size: 64
38
+ - eval_batch_size: 8
39
+ - seed: 42
40
+ - distributed_type: multi-GPU
41
+ - num_devices: 2
42
+ - total_train_batch_size: 128
43
+ - total_eval_batch_size: 16
44
+ - optimizer: adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 (no additional optimizer arguments)
45
+ - lr_scheduler_type: linear
46
+ - num_epochs: 1.0
47
+
48
+ ### Training results
49
+
50
+
51
+
52
+ ### Framework versions
53
+
54
+ - Transformers 4.51.3
55
+ - Pytorch 2.6.0+cu124
56
+ - Datasets 3.6.0
57
+ - Tokenizers 0.21.1
added_tokens.json ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "<extra_id_0>": 32099,
3
+ "<extra_id_10>": 32089,
4
+ "<extra_id_11>": 32088,
5
+ "<extra_id_12>": 32087,
6
+ "<extra_id_13>": 32086,
7
+ "<extra_id_14>": 32085,
8
+ "<extra_id_15>": 32084,
9
+ "<extra_id_16>": 32083,
10
+ "<extra_id_17>": 32082,
11
+ "<extra_id_18>": 32081,
12
+ "<extra_id_19>": 32080,
13
+ "<extra_id_1>": 32098,
14
+ "<extra_id_20>": 32079,
15
+ "<extra_id_21>": 32078,
16
+ "<extra_id_22>": 32077,
17
+ "<extra_id_23>": 32076,
18
+ "<extra_id_24>": 32075,
19
+ "<extra_id_25>": 32074,
20
+ "<extra_id_26>": 32073,
21
+ "<extra_id_27>": 32072,
22
+ "<extra_id_28>": 32071,
23
+ "<extra_id_29>": 32070,
24
+ "<extra_id_2>": 32097,
25
+ "<extra_id_30>": 32069,
26
+ "<extra_id_31>": 32068,
27
+ "<extra_id_32>": 32067,
28
+ "<extra_id_33>": 32066,
29
+ "<extra_id_34>": 32065,
30
+ "<extra_id_35>": 32064,
31
+ "<extra_id_36>": 32063,
32
+ "<extra_id_37>": 32062,
33
+ "<extra_id_38>": 32061,
34
+ "<extra_id_39>": 32060,
35
+ "<extra_id_3>": 32096,
36
+ "<extra_id_40>": 32059,
37
+ "<extra_id_41>": 32058,
38
+ "<extra_id_42>": 32057,
39
+ "<extra_id_43>": 32056,
40
+ "<extra_id_44>": 32055,
41
+ "<extra_id_45>": 32054,
42
+ "<extra_id_46>": 32053,
43
+ "<extra_id_47>": 32052,
44
+ "<extra_id_48>": 32051,
45
+ "<extra_id_49>": 32050,
46
+ "<extra_id_4>": 32095,
47
+ "<extra_id_50>": 32049,
48
+ "<extra_id_51>": 32048,
49
+ "<extra_id_52>": 32047,
50
+ "<extra_id_53>": 32046,
51
+ "<extra_id_54>": 32045,
52
+ "<extra_id_55>": 32044,
53
+ "<extra_id_56>": 32043,
54
+ "<extra_id_57>": 32042,
55
+ "<extra_id_58>": 32041,
56
+ "<extra_id_59>": 32040,
57
+ "<extra_id_5>": 32094,
58
+ "<extra_id_60>": 32039,
59
+ "<extra_id_61>": 32038,
60
+ "<extra_id_62>": 32037,
61
+ "<extra_id_63>": 32036,
62
+ "<extra_id_64>": 32035,
63
+ "<extra_id_65>": 32034,
64
+ "<extra_id_66>": 32033,
65
+ "<extra_id_67>": 32032,
66
+ "<extra_id_68>": 32031,
67
+ "<extra_id_69>": 32030,
68
+ "<extra_id_6>": 32093,
69
+ "<extra_id_70>": 32029,
70
+ "<extra_id_71>": 32028,
71
+ "<extra_id_72>": 32027,
72
+ "<extra_id_73>": 32026,
73
+ "<extra_id_74>": 32025,
74
+ "<extra_id_75>": 32024,
75
+ "<extra_id_76>": 32023,
76
+ "<extra_id_77>": 32022,
77
+ "<extra_id_78>": 32021,
78
+ "<extra_id_79>": 32020,
79
+ "<extra_id_7>": 32092,
80
+ "<extra_id_80>": 32019,
81
+ "<extra_id_81>": 32018,
82
+ "<extra_id_82>": 32017,
83
+ "<extra_id_83>": 32016,
84
+ "<extra_id_84>": 32015,
85
+ "<extra_id_85>": 32014,
86
+ "<extra_id_86>": 32013,
87
+ "<extra_id_87>": 32012,
88
+ "<extra_id_88>": 32011,
89
+ "<extra_id_89>": 32010,
90
+ "<extra_id_8>": 32091,
91
+ "<extra_id_90>": 32009,
92
+ "<extra_id_91>": 32008,
93
+ "<extra_id_92>": 32007,
94
+ "<extra_id_93>": 32006,
95
+ "<extra_id_94>": 32005,
96
+ "<extra_id_95>": 32004,
97
+ "<extra_id_96>": 32003,
98
+ "<extra_id_97>": 32002,
99
+ "<extra_id_98>": 32001,
100
+ "<extra_id_99>": 32000,
101
+ "<extra_id_9>": 32090
102
+ }
config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "T5ForConditionalGeneration"
4
+ ],
5
+ "classifier_dropout": 0.0,
6
+ "d_ff": 2816,
7
+ "d_kv": 64,
8
+ "d_model": 1024,
9
+ "decoder_start_token_id": 0,
10
+ "dense_act_fn": "gelu_new",
11
+ "dropout_rate": 0.1,
12
+ "eos_token_id": 1,
13
+ "feed_forward_proj": "gated-gelu",
14
+ "initializer_factor": 1.0,
15
+ "is_encoder_decoder": true,
16
+ "is_gated_act": true,
17
+ "layer_norm_epsilon": 1e-06,
18
+ "model_type": "t5",
19
+ "num_decoder_layers": 24,
20
+ "num_heads": 16,
21
+ "num_layers": 24,
22
+ "output_past": true,
23
+ "pad_token_id": 0,
24
+ "relative_attention_max_distance": 128,
25
+ "relative_attention_num_buckets": 32,
26
+ "tie_word_embeddings": false,
27
+ "torch_dtype": "float32",
28
+ "transformers_version": "4.51.3",
29
+ "use_cache": true,
30
+ "vocab_size": 32128
31
+ }
generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "decoder_start_token_id": 0,
4
+ "eos_token_id": 1,
5
+ "pad_token_id": 0,
6
+ "transformers_version": "4.51.3"
7
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be0e82516518c40428bed4ba7599cb602ce7616116c12519d19d8e0cb78f8964
3
+ size 3132668808
special_tokens_map.json ADDED
@@ -0,0 +1,125 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<extra_id_0>",
4
+ "<extra_id_1>",
5
+ "<extra_id_2>",
6
+ "<extra_id_3>",
7
+ "<extra_id_4>",
8
+ "<extra_id_5>",
9
+ "<extra_id_6>",
10
+ "<extra_id_7>",
11
+ "<extra_id_8>",
12
+ "<extra_id_9>",
13
+ "<extra_id_10>",
14
+ "<extra_id_11>",
15
+ "<extra_id_12>",
16
+ "<extra_id_13>",
17
+ "<extra_id_14>",
18
+ "<extra_id_15>",
19
+ "<extra_id_16>",
20
+ "<extra_id_17>",
21
+ "<extra_id_18>",
22
+ "<extra_id_19>",
23
+ "<extra_id_20>",
24
+ "<extra_id_21>",
25
+ "<extra_id_22>",
26
+ "<extra_id_23>",
27
+ "<extra_id_24>",
28
+ "<extra_id_25>",
29
+ "<extra_id_26>",
30
+ "<extra_id_27>",
31
+ "<extra_id_28>",
32
+ "<extra_id_29>",
33
+ "<extra_id_30>",
34
+ "<extra_id_31>",
35
+ "<extra_id_32>",
36
+ "<extra_id_33>",
37
+ "<extra_id_34>",
38
+ "<extra_id_35>",
39
+ "<extra_id_36>",
40
+ "<extra_id_37>",
41
+ "<extra_id_38>",
42
+ "<extra_id_39>",
43
+ "<extra_id_40>",
44
+ "<extra_id_41>",
45
+ "<extra_id_42>",
46
+ "<extra_id_43>",
47
+ "<extra_id_44>",
48
+ "<extra_id_45>",
49
+ "<extra_id_46>",
50
+ "<extra_id_47>",
51
+ "<extra_id_48>",
52
+ "<extra_id_49>",
53
+ "<extra_id_50>",
54
+ "<extra_id_51>",
55
+ "<extra_id_52>",
56
+ "<extra_id_53>",
57
+ "<extra_id_54>",
58
+ "<extra_id_55>",
59
+ "<extra_id_56>",
60
+ "<extra_id_57>",
61
+ "<extra_id_58>",
62
+ "<extra_id_59>",
63
+ "<extra_id_60>",
64
+ "<extra_id_61>",
65
+ "<extra_id_62>",
66
+ "<extra_id_63>",
67
+ "<extra_id_64>",
68
+ "<extra_id_65>",
69
+ "<extra_id_66>",
70
+ "<extra_id_67>",
71
+ "<extra_id_68>",
72
+ "<extra_id_69>",
73
+ "<extra_id_70>",
74
+ "<extra_id_71>",
75
+ "<extra_id_72>",
76
+ "<extra_id_73>",
77
+ "<extra_id_74>",
78
+ "<extra_id_75>",
79
+ "<extra_id_76>",
80
+ "<extra_id_77>",
81
+ "<extra_id_78>",
82
+ "<extra_id_79>",
83
+ "<extra_id_80>",
84
+ "<extra_id_81>",
85
+ "<extra_id_82>",
86
+ "<extra_id_83>",
87
+ "<extra_id_84>",
88
+ "<extra_id_85>",
89
+ "<extra_id_86>",
90
+ "<extra_id_87>",
91
+ "<extra_id_88>",
92
+ "<extra_id_89>",
93
+ "<extra_id_90>",
94
+ "<extra_id_91>",
95
+ "<extra_id_92>",
96
+ "<extra_id_93>",
97
+ "<extra_id_94>",
98
+ "<extra_id_95>",
99
+ "<extra_id_96>",
100
+ "<extra_id_97>",
101
+ "<extra_id_98>",
102
+ "<extra_id_99>"
103
+ ],
104
+ "eos_token": {
105
+ "content": "</s>",
106
+ "lstrip": false,
107
+ "normalized": false,
108
+ "rstrip": false,
109
+ "single_word": false
110
+ },
111
+ "pad_token": {
112
+ "content": "<pad>",
113
+ "lstrip": false,
114
+ "normalized": false,
115
+ "rstrip": false,
116
+ "single_word": false
117
+ },
118
+ "unk_token": {
119
+ "content": "<unk>",
120
+ "lstrip": false,
121
+ "normalized": false,
122
+ "rstrip": false,
123
+ "single_word": false
124
+ }
125
+ }
spiece.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d60acb128cf7b7f2536e8f38a5b18a05535c9e14c7a355904270e15b0945ea86
3
+ size 791656
tokenizer_config.json ADDED
@@ -0,0 +1,942 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": true,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "<pad>",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "1": {
13
+ "content": "</s>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "2": {
21
+ "content": "<unk>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "32000": {
29
+ "content": "<extra_id_99>",
30
+ "lstrip": true,
31
+ "normalized": false,
32
+ "rstrip": true,
33
+ "single_word": false,
34
+ "special": true
35
+ },
36
+ "32001": {
37
+ "content": "<extra_id_98>",
38
+ "lstrip": true,
39
+ "normalized": false,
40
+ "rstrip": true,
41
+ "single_word": false,
42
+ "special": true
43
+ },
44
+ "32002": {
45
+ "content": "<extra_id_97>",
46
+ "lstrip": true,
47
+ "normalized": false,
48
+ "rstrip": true,
49
+ "single_word": false,
50
+ "special": true
51
+ },
52
+ "32003": {
53
+ "content": "<extra_id_96>",
54
+ "lstrip": true,
55
+ "normalized": false,
56
+ "rstrip": true,
57
+ "single_word": false,
58
+ "special": true
59
+ },
60
+ "32004": {
61
+ "content": "<extra_id_95>",
62
+ "lstrip": true,
63
+ "normalized": false,
64
+ "rstrip": true,
65
+ "single_word": false,
66
+ "special": true
67
+ },
68
+ "32005": {
69
+ "content": "<extra_id_94>",
70
+ "lstrip": true,
71
+ "normalized": false,
72
+ "rstrip": true,
73
+ "single_word": false,
74
+ "special": true
75
+ },
76
+ "32006": {
77
+ "content": "<extra_id_93>",
78
+ "lstrip": true,
79
+ "normalized": false,
80
+ "rstrip": true,
81
+ "single_word": false,
82
+ "special": true
83
+ },
84
+ "32007": {
85
+ "content": "<extra_id_92>",
86
+ "lstrip": true,
87
+ "normalized": false,
88
+ "rstrip": true,
89
+ "single_word": false,
90
+ "special": true
91
+ },
92
+ "32008": {
93
+ "content": "<extra_id_91>",
94
+ "lstrip": true,
95
+ "normalized": false,
96
+ "rstrip": true,
97
+ "single_word": false,
98
+ "special": true
99
+ },
100
+ "32009": {
101
+ "content": "<extra_id_90>",
102
+ "lstrip": true,
103
+ "normalized": false,
104
+ "rstrip": true,
105
+ "single_word": false,
106
+ "special": true
107
+ },
108
+ "32010": {
109
+ "content": "<extra_id_89>",
110
+ "lstrip": true,
111
+ "normalized": false,
112
+ "rstrip": true,
113
+ "single_word": false,
114
+ "special": true
115
+ },
116
+ "32011": {
117
+ "content": "<extra_id_88>",
118
+ "lstrip": true,
119
+ "normalized": false,
120
+ "rstrip": true,
121
+ "single_word": false,
122
+ "special": true
123
+ },
124
+ "32012": {
125
+ "content": "<extra_id_87>",
126
+ "lstrip": true,
127
+ "normalized": false,
128
+ "rstrip": true,
129
+ "single_word": false,
130
+ "special": true
131
+ },
132
+ "32013": {
133
+ "content": "<extra_id_86>",
134
+ "lstrip": true,
135
+ "normalized": false,
136
+ "rstrip": true,
137
+ "single_word": false,
138
+ "special": true
139
+ },
140
+ "32014": {
141
+ "content": "<extra_id_85>",
142
+ "lstrip": true,
143
+ "normalized": false,
144
+ "rstrip": true,
145
+ "single_word": false,
146
+ "special": true
147
+ },
148
+ "32015": {
149
+ "content": "<extra_id_84>",
150
+ "lstrip": true,
151
+ "normalized": false,
152
+ "rstrip": true,
153
+ "single_word": false,
154
+ "special": true
155
+ },
156
+ "32016": {
157
+ "content": "<extra_id_83>",
158
+ "lstrip": true,
159
+ "normalized": false,
160
+ "rstrip": true,
161
+ "single_word": false,
162
+ "special": true
163
+ },
164
+ "32017": {
165
+ "content": "<extra_id_82>",
166
+ "lstrip": true,
167
+ "normalized": false,
168
+ "rstrip": true,
169
+ "single_word": false,
170
+ "special": true
171
+ },
172
+ "32018": {
173
+ "content": "<extra_id_81>",
174
+ "lstrip": true,
175
+ "normalized": false,
176
+ "rstrip": true,
177
+ "single_word": false,
178
+ "special": true
179
+ },
180
+ "32019": {
181
+ "content": "<extra_id_80>",
182
+ "lstrip": true,
183
+ "normalized": false,
184
+ "rstrip": true,
185
+ "single_word": false,
186
+ "special": true
187
+ },
188
+ "32020": {
189
+ "content": "<extra_id_79>",
190
+ "lstrip": true,
191
+ "normalized": false,
192
+ "rstrip": true,
193
+ "single_word": false,
194
+ "special": true
195
+ },
196
+ "32021": {
197
+ "content": "<extra_id_78>",
198
+ "lstrip": true,
199
+ "normalized": false,
200
+ "rstrip": true,
201
+ "single_word": false,
202
+ "special": true
203
+ },
204
+ "32022": {
205
+ "content": "<extra_id_77>",
206
+ "lstrip": true,
207
+ "normalized": false,
208
+ "rstrip": true,
209
+ "single_word": false,
210
+ "special": true
211
+ },
212
+ "32023": {
213
+ "content": "<extra_id_76>",
214
+ "lstrip": true,
215
+ "normalized": false,
216
+ "rstrip": true,
217
+ "single_word": false,
218
+ "special": true
219
+ },
220
+ "32024": {
221
+ "content": "<extra_id_75>",
222
+ "lstrip": true,
223
+ "normalized": false,
224
+ "rstrip": true,
225
+ "single_word": false,
226
+ "special": true
227
+ },
228
+ "32025": {
229
+ "content": "<extra_id_74>",
230
+ "lstrip": true,
231
+ "normalized": false,
232
+ "rstrip": true,
233
+ "single_word": false,
234
+ "special": true
235
+ },
236
+ "32026": {
237
+ "content": "<extra_id_73>",
238
+ "lstrip": true,
239
+ "normalized": false,
240
+ "rstrip": true,
241
+ "single_word": false,
242
+ "special": true
243
+ },
244
+ "32027": {
245
+ "content": "<extra_id_72>",
246
+ "lstrip": true,
247
+ "normalized": false,
248
+ "rstrip": true,
249
+ "single_word": false,
250
+ "special": true
251
+ },
252
+ "32028": {
253
+ "content": "<extra_id_71>",
254
+ "lstrip": true,
255
+ "normalized": false,
256
+ "rstrip": true,
257
+ "single_word": false,
258
+ "special": true
259
+ },
260
+ "32029": {
261
+ "content": "<extra_id_70>",
262
+ "lstrip": true,
263
+ "normalized": false,
264
+ "rstrip": true,
265
+ "single_word": false,
266
+ "special": true
267
+ },
268
+ "32030": {
269
+ "content": "<extra_id_69>",
270
+ "lstrip": true,
271
+ "normalized": false,
272
+ "rstrip": true,
273
+ "single_word": false,
274
+ "special": true
275
+ },
276
+ "32031": {
277
+ "content": "<extra_id_68>",
278
+ "lstrip": true,
279
+ "normalized": false,
280
+ "rstrip": true,
281
+ "single_word": false,
282
+ "special": true
283
+ },
284
+ "32032": {
285
+ "content": "<extra_id_67>",
286
+ "lstrip": true,
287
+ "normalized": false,
288
+ "rstrip": true,
289
+ "single_word": false,
290
+ "special": true
291
+ },
292
+ "32033": {
293
+ "content": "<extra_id_66>",
294
+ "lstrip": true,
295
+ "normalized": false,
296
+ "rstrip": true,
297
+ "single_word": false,
298
+ "special": true
299
+ },
300
+ "32034": {
301
+ "content": "<extra_id_65>",
302
+ "lstrip": true,
303
+ "normalized": false,
304
+ "rstrip": true,
305
+ "single_word": false,
306
+ "special": true
307
+ },
308
+ "32035": {
309
+ "content": "<extra_id_64>",
310
+ "lstrip": true,
311
+ "normalized": false,
312
+ "rstrip": true,
313
+ "single_word": false,
314
+ "special": true
315
+ },
316
+ "32036": {
317
+ "content": "<extra_id_63>",
318
+ "lstrip": true,
319
+ "normalized": false,
320
+ "rstrip": true,
321
+ "single_word": false,
322
+ "special": true
323
+ },
324
+ "32037": {
325
+ "content": "<extra_id_62>",
326
+ "lstrip": true,
327
+ "normalized": false,
328
+ "rstrip": true,
329
+ "single_word": false,
330
+ "special": true
331
+ },
332
+ "32038": {
333
+ "content": "<extra_id_61>",
334
+ "lstrip": true,
335
+ "normalized": false,
336
+ "rstrip": true,
337
+ "single_word": false,
338
+ "special": true
339
+ },
340
+ "32039": {
341
+ "content": "<extra_id_60>",
342
+ "lstrip": true,
343
+ "normalized": false,
344
+ "rstrip": true,
345
+ "single_word": false,
346
+ "special": true
347
+ },
348
+ "32040": {
349
+ "content": "<extra_id_59>",
350
+ "lstrip": true,
351
+ "normalized": false,
352
+ "rstrip": true,
353
+ "single_word": false,
354
+ "special": true
355
+ },
356
+ "32041": {
357
+ "content": "<extra_id_58>",
358
+ "lstrip": true,
359
+ "normalized": false,
360
+ "rstrip": true,
361
+ "single_word": false,
362
+ "special": true
363
+ },
364
+ "32042": {
365
+ "content": "<extra_id_57>",
366
+ "lstrip": true,
367
+ "normalized": false,
368
+ "rstrip": true,
369
+ "single_word": false,
370
+ "special": true
371
+ },
372
+ "32043": {
373
+ "content": "<extra_id_56>",
374
+ "lstrip": true,
375
+ "normalized": false,
376
+ "rstrip": true,
377
+ "single_word": false,
378
+ "special": true
379
+ },
380
+ "32044": {
381
+ "content": "<extra_id_55>",
382
+ "lstrip": true,
383
+ "normalized": false,
384
+ "rstrip": true,
385
+ "single_word": false,
386
+ "special": true
387
+ },
388
+ "32045": {
389
+ "content": "<extra_id_54>",
390
+ "lstrip": true,
391
+ "normalized": false,
392
+ "rstrip": true,
393
+ "single_word": false,
394
+ "special": true
395
+ },
396
+ "32046": {
397
+ "content": "<extra_id_53>",
398
+ "lstrip": true,
399
+ "normalized": false,
400
+ "rstrip": true,
401
+ "single_word": false,
402
+ "special": true
403
+ },
404
+ "32047": {
405
+ "content": "<extra_id_52>",
406
+ "lstrip": true,
407
+ "normalized": false,
408
+ "rstrip": true,
409
+ "single_word": false,
410
+ "special": true
411
+ },
412
+ "32048": {
413
+ "content": "<extra_id_51>",
414
+ "lstrip": true,
415
+ "normalized": false,
416
+ "rstrip": true,
417
+ "single_word": false,
418
+ "special": true
419
+ },
420
+ "32049": {
421
+ "content": "<extra_id_50>",
422
+ "lstrip": true,
423
+ "normalized": false,
424
+ "rstrip": true,
425
+ "single_word": false,
426
+ "special": true
427
+ },
428
+ "32050": {
429
+ "content": "<extra_id_49>",
430
+ "lstrip": true,
431
+ "normalized": false,
432
+ "rstrip": true,
433
+ "single_word": false,
434
+ "special": true
435
+ },
436
+ "32051": {
437
+ "content": "<extra_id_48>",
438
+ "lstrip": true,
439
+ "normalized": false,
440
+ "rstrip": true,
441
+ "single_word": false,
442
+ "special": true
443
+ },
444
+ "32052": {
445
+ "content": "<extra_id_47>",
446
+ "lstrip": true,
447
+ "normalized": false,
448
+ "rstrip": true,
449
+ "single_word": false,
450
+ "special": true
451
+ },
452
+ "32053": {
453
+ "content": "<extra_id_46>",
454
+ "lstrip": true,
455
+ "normalized": false,
456
+ "rstrip": true,
457
+ "single_word": false,
458
+ "special": true
459
+ },
460
+ "32054": {
461
+ "content": "<extra_id_45>",
462
+ "lstrip": true,
463
+ "normalized": false,
464
+ "rstrip": true,
465
+ "single_word": false,
466
+ "special": true
467
+ },
468
+ "32055": {
469
+ "content": "<extra_id_44>",
470
+ "lstrip": true,
471
+ "normalized": false,
472
+ "rstrip": true,
473
+ "single_word": false,
474
+ "special": true
475
+ },
476
+ "32056": {
477
+ "content": "<extra_id_43>",
478
+ "lstrip": true,
479
+ "normalized": false,
480
+ "rstrip": true,
481
+ "single_word": false,
482
+ "special": true
483
+ },
484
+ "32057": {
485
+ "content": "<extra_id_42>",
486
+ "lstrip": true,
487
+ "normalized": false,
488
+ "rstrip": true,
489
+ "single_word": false,
490
+ "special": true
491
+ },
492
+ "32058": {
493
+ "content": "<extra_id_41>",
494
+ "lstrip": true,
495
+ "normalized": false,
496
+ "rstrip": true,
497
+ "single_word": false,
498
+ "special": true
499
+ },
500
+ "32059": {
501
+ "content": "<extra_id_40>",
502
+ "lstrip": true,
503
+ "normalized": false,
504
+ "rstrip": true,
505
+ "single_word": false,
506
+ "special": true
507
+ },
508
+ "32060": {
509
+ "content": "<extra_id_39>",
510
+ "lstrip": true,
511
+ "normalized": false,
512
+ "rstrip": true,
513
+ "single_word": false,
514
+ "special": true
515
+ },
516
+ "32061": {
517
+ "content": "<extra_id_38>",
518
+ "lstrip": true,
519
+ "normalized": false,
520
+ "rstrip": true,
521
+ "single_word": false,
522
+ "special": true
523
+ },
524
+ "32062": {
525
+ "content": "<extra_id_37>",
526
+ "lstrip": true,
527
+ "normalized": false,
528
+ "rstrip": true,
529
+ "single_word": false,
530
+ "special": true
531
+ },
532
+ "32063": {
533
+ "content": "<extra_id_36>",
534
+ "lstrip": true,
535
+ "normalized": false,
536
+ "rstrip": true,
537
+ "single_word": false,
538
+ "special": true
539
+ },
540
+ "32064": {
541
+ "content": "<extra_id_35>",
542
+ "lstrip": true,
543
+ "normalized": false,
544
+ "rstrip": true,
545
+ "single_word": false,
546
+ "special": true
547
+ },
548
+ "32065": {
549
+ "content": "<extra_id_34>",
550
+ "lstrip": true,
551
+ "normalized": false,
552
+ "rstrip": true,
553
+ "single_word": false,
554
+ "special": true
555
+ },
556
+ "32066": {
557
+ "content": "<extra_id_33>",
558
+ "lstrip": true,
559
+ "normalized": false,
560
+ "rstrip": true,
561
+ "single_word": false,
562
+ "special": true
563
+ },
564
+ "32067": {
565
+ "content": "<extra_id_32>",
566
+ "lstrip": true,
567
+ "normalized": false,
568
+ "rstrip": true,
569
+ "single_word": false,
570
+ "special": true
571
+ },
572
+ "32068": {
573
+ "content": "<extra_id_31>",
574
+ "lstrip": true,
575
+ "normalized": false,
576
+ "rstrip": true,
577
+ "single_word": false,
578
+ "special": true
579
+ },
580
+ "32069": {
581
+ "content": "<extra_id_30>",
582
+ "lstrip": true,
583
+ "normalized": false,
584
+ "rstrip": true,
585
+ "single_word": false,
586
+ "special": true
587
+ },
588
+ "32070": {
589
+ "content": "<extra_id_29>",
590
+ "lstrip": true,
591
+ "normalized": false,
592
+ "rstrip": true,
593
+ "single_word": false,
594
+ "special": true
595
+ },
596
+ "32071": {
597
+ "content": "<extra_id_28>",
598
+ "lstrip": true,
599
+ "normalized": false,
600
+ "rstrip": true,
601
+ "single_word": false,
602
+ "special": true
603
+ },
604
+ "32072": {
605
+ "content": "<extra_id_27>",
606
+ "lstrip": true,
607
+ "normalized": false,
608
+ "rstrip": true,
609
+ "single_word": false,
610
+ "special": true
611
+ },
612
+ "32073": {
613
+ "content": "<extra_id_26>",
614
+ "lstrip": true,
615
+ "normalized": false,
616
+ "rstrip": true,
617
+ "single_word": false,
618
+ "special": true
619
+ },
620
+ "32074": {
621
+ "content": "<extra_id_25>",
622
+ "lstrip": true,
623
+ "normalized": false,
624
+ "rstrip": true,
625
+ "single_word": false,
626
+ "special": true
627
+ },
628
+ "32075": {
629
+ "content": "<extra_id_24>",
630
+ "lstrip": true,
631
+ "normalized": false,
632
+ "rstrip": true,
633
+ "single_word": false,
634
+ "special": true
635
+ },
636
+ "32076": {
637
+ "content": "<extra_id_23>",
638
+ "lstrip": true,
639
+ "normalized": false,
640
+ "rstrip": true,
641
+ "single_word": false,
642
+ "special": true
643
+ },
644
+ "32077": {
645
+ "content": "<extra_id_22>",
646
+ "lstrip": true,
647
+ "normalized": false,
648
+ "rstrip": true,
649
+ "single_word": false,
650
+ "special": true
651
+ },
652
+ "32078": {
653
+ "content": "<extra_id_21>",
654
+ "lstrip": true,
655
+ "normalized": false,
656
+ "rstrip": true,
657
+ "single_word": false,
658
+ "special": true
659
+ },
660
+ "32079": {
661
+ "content": "<extra_id_20>",
662
+ "lstrip": true,
663
+ "normalized": false,
664
+ "rstrip": true,
665
+ "single_word": false,
666
+ "special": true
667
+ },
668
+ "32080": {
669
+ "content": "<extra_id_19>",
670
+ "lstrip": true,
671
+ "normalized": false,
672
+ "rstrip": true,
673
+ "single_word": false,
674
+ "special": true
675
+ },
676
+ "32081": {
677
+ "content": "<extra_id_18>",
678
+ "lstrip": true,
679
+ "normalized": false,
680
+ "rstrip": true,
681
+ "single_word": false,
682
+ "special": true
683
+ },
684
+ "32082": {
685
+ "content": "<extra_id_17>",
686
+ "lstrip": true,
687
+ "normalized": false,
688
+ "rstrip": true,
689
+ "single_word": false,
690
+ "special": true
691
+ },
692
+ "32083": {
693
+ "content": "<extra_id_16>",
694
+ "lstrip": true,
695
+ "normalized": false,
696
+ "rstrip": true,
697
+ "single_word": false,
698
+ "special": true
699
+ },
700
+ "32084": {
701
+ "content": "<extra_id_15>",
702
+ "lstrip": true,
703
+ "normalized": false,
704
+ "rstrip": true,
705
+ "single_word": false,
706
+ "special": true
707
+ },
708
+ "32085": {
709
+ "content": "<extra_id_14>",
710
+ "lstrip": true,
711
+ "normalized": false,
712
+ "rstrip": true,
713
+ "single_word": false,
714
+ "special": true
715
+ },
716
+ "32086": {
717
+ "content": "<extra_id_13>",
718
+ "lstrip": true,
719
+ "normalized": false,
720
+ "rstrip": true,
721
+ "single_word": false,
722
+ "special": true
723
+ },
724
+ "32087": {
725
+ "content": "<extra_id_12>",
726
+ "lstrip": true,
727
+ "normalized": false,
728
+ "rstrip": true,
729
+ "single_word": false,
730
+ "special": true
731
+ },
732
+ "32088": {
733
+ "content": "<extra_id_11>",
734
+ "lstrip": true,
735
+ "normalized": false,
736
+ "rstrip": true,
737
+ "single_word": false,
738
+ "special": true
739
+ },
740
+ "32089": {
741
+ "content": "<extra_id_10>",
742
+ "lstrip": true,
743
+ "normalized": false,
744
+ "rstrip": true,
745
+ "single_word": false,
746
+ "special": true
747
+ },
748
+ "32090": {
749
+ "content": "<extra_id_9>",
750
+ "lstrip": true,
751
+ "normalized": false,
752
+ "rstrip": true,
753
+ "single_word": false,
754
+ "special": true
755
+ },
756
+ "32091": {
757
+ "content": "<extra_id_8>",
758
+ "lstrip": true,
759
+ "normalized": false,
760
+ "rstrip": true,
761
+ "single_word": false,
762
+ "special": true
763
+ },
764
+ "32092": {
765
+ "content": "<extra_id_7>",
766
+ "lstrip": true,
767
+ "normalized": false,
768
+ "rstrip": true,
769
+ "single_word": false,
770
+ "special": true
771
+ },
772
+ "32093": {
773
+ "content": "<extra_id_6>",
774
+ "lstrip": true,
775
+ "normalized": false,
776
+ "rstrip": true,
777
+ "single_word": false,
778
+ "special": true
779
+ },
780
+ "32094": {
781
+ "content": "<extra_id_5>",
782
+ "lstrip": true,
783
+ "normalized": false,
784
+ "rstrip": true,
785
+ "single_word": false,
786
+ "special": true
787
+ },
788
+ "32095": {
789
+ "content": "<extra_id_4>",
790
+ "lstrip": true,
791
+ "normalized": false,
792
+ "rstrip": true,
793
+ "single_word": false,
794
+ "special": true
795
+ },
796
+ "32096": {
797
+ "content": "<extra_id_3>",
798
+ "lstrip": true,
799
+ "normalized": false,
800
+ "rstrip": true,
801
+ "single_word": false,
802
+ "special": true
803
+ },
804
+ "32097": {
805
+ "content": "<extra_id_2>",
806
+ "lstrip": true,
807
+ "normalized": false,
808
+ "rstrip": true,
809
+ "single_word": false,
810
+ "special": true
811
+ },
812
+ "32098": {
813
+ "content": "<extra_id_1>",
814
+ "lstrip": true,
815
+ "normalized": false,
816
+ "rstrip": true,
817
+ "single_word": false,
818
+ "special": true
819
+ },
820
+ "32099": {
821
+ "content": "<extra_id_0>",
822
+ "lstrip": true,
823
+ "normalized": false,
824
+ "rstrip": true,
825
+ "single_word": false,
826
+ "special": true
827
+ }
828
+ },
829
+ "additional_special_tokens": [
830
+ "<extra_id_0>",
831
+ "<extra_id_1>",
832
+ "<extra_id_2>",
833
+ "<extra_id_3>",
834
+ "<extra_id_4>",
835
+ "<extra_id_5>",
836
+ "<extra_id_6>",
837
+ "<extra_id_7>",
838
+ "<extra_id_8>",
839
+ "<extra_id_9>",
840
+ "<extra_id_10>",
841
+ "<extra_id_11>",
842
+ "<extra_id_12>",
843
+ "<extra_id_13>",
844
+ "<extra_id_14>",
845
+ "<extra_id_15>",
846
+ "<extra_id_16>",
847
+ "<extra_id_17>",
848
+ "<extra_id_18>",
849
+ "<extra_id_19>",
850
+ "<extra_id_20>",
851
+ "<extra_id_21>",
852
+ "<extra_id_22>",
853
+ "<extra_id_23>",
854
+ "<extra_id_24>",
855
+ "<extra_id_25>",
856
+ "<extra_id_26>",
857
+ "<extra_id_27>",
858
+ "<extra_id_28>",
859
+ "<extra_id_29>",
860
+ "<extra_id_30>",
861
+ "<extra_id_31>",
862
+ "<extra_id_32>",
863
+ "<extra_id_33>",
864
+ "<extra_id_34>",
865
+ "<extra_id_35>",
866
+ "<extra_id_36>",
867
+ "<extra_id_37>",
868
+ "<extra_id_38>",
869
+ "<extra_id_39>",
870
+ "<extra_id_40>",
871
+ "<extra_id_41>",
872
+ "<extra_id_42>",
873
+ "<extra_id_43>",
874
+ "<extra_id_44>",
875
+ "<extra_id_45>",
876
+ "<extra_id_46>",
877
+ "<extra_id_47>",
878
+ "<extra_id_48>",
879
+ "<extra_id_49>",
880
+ "<extra_id_50>",
881
+ "<extra_id_51>",
882
+ "<extra_id_52>",
883
+ "<extra_id_53>",
884
+ "<extra_id_54>",
885
+ "<extra_id_55>",
886
+ "<extra_id_56>",
887
+ "<extra_id_57>",
888
+ "<extra_id_58>",
889
+ "<extra_id_59>",
890
+ "<extra_id_60>",
891
+ "<extra_id_61>",
892
+ "<extra_id_62>",
893
+ "<extra_id_63>",
894
+ "<extra_id_64>",
895
+ "<extra_id_65>",
896
+ "<extra_id_66>",
897
+ "<extra_id_67>",
898
+ "<extra_id_68>",
899
+ "<extra_id_69>",
900
+ "<extra_id_70>",
901
+ "<extra_id_71>",
902
+ "<extra_id_72>",
903
+ "<extra_id_73>",
904
+ "<extra_id_74>",
905
+ "<extra_id_75>",
906
+ "<extra_id_76>",
907
+ "<extra_id_77>",
908
+ "<extra_id_78>",
909
+ "<extra_id_79>",
910
+ "<extra_id_80>",
911
+ "<extra_id_81>",
912
+ "<extra_id_82>",
913
+ "<extra_id_83>",
914
+ "<extra_id_84>",
915
+ "<extra_id_85>",
916
+ "<extra_id_86>",
917
+ "<extra_id_87>",
918
+ "<extra_id_88>",
919
+ "<extra_id_89>",
920
+ "<extra_id_90>",
921
+ "<extra_id_91>",
922
+ "<extra_id_92>",
923
+ "<extra_id_93>",
924
+ "<extra_id_94>",
925
+ "<extra_id_95>",
926
+ "<extra_id_96>",
927
+ "<extra_id_97>",
928
+ "<extra_id_98>",
929
+ "<extra_id_99>"
930
+ ],
931
+ "clean_up_tokenization_spaces": false,
932
+ "eos_token": "</s>",
933
+ "extra_ids": 100,
934
+ "extra_special_tokens": {},
935
+ "legacy": true,
936
+ "model_max_length": 32768,
937
+ "pad_token": "<pad>",
938
+ "padding_side": "right",
939
+ "sp_model_kwargs": {},
940
+ "tokenizer_class": "T5Tokenizer",
941
+ "unk_token": "<unk>"
942
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f44a57468978cd51e95a6dcbccb3d038c415aff86a8c4e29f117ba99cb8fdb2b
3
+ size 5368