furmaniak commited on
Commit
27a14b5
·
verified ·
1 Parent(s): ee323e5

Training in progress, step 355

Browse files
model-00001-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d50c4cd12cb541285066357be1584c142285981fc00429bd054bf07472ab55e5
3
  size 4891730992
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83b6d09c36dfde2dde2aca411c8cf9b8b73c48deeb0f16bb48de6800e95b6b08
3
  size 4891730992
model-00002-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8377fefc4225b886564e54582aeb0fd9cbd286197627d2111d2d0ab7343e3bd5
3
  size 4876059352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9095a1411aa42afdc93bdaf3630b02d51b6549559bdeb9c60bbbc70b838d440
3
  size 4876059352
model-00003-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4c132bb7b19a8ab698cd2d4f2c51ed2a4c3a9f2ba13e0e8727a7687a7eafc57a
3
  size 4876059384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2109ad4a5b21fa3d65cc3c8d891e2c2f0a5209cc9eb3ea9014b7e62c4ab716c
3
  size 4876059384
model-00004-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:336a925a4d307f0bfda4124a8895a16cb05247ba0627851d4482ab4bf69fdc93
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d863c759c7dde217501fcb16ed614dd9c6c2461d1fe6b0b90634fd7132cd09e3
3
  size 4876059416
model-00005-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f72a554fc5cae4d17d2503956e6885dda4551c9c4dbf9fc76994c7b311f37b54
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10d545e0cdd6292e08f02aafcdc85c971869d85197923faa1f2f809fb26f8eab
3
  size 4876059416
model-00006-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:11655f97daf781faa1d9a011e8970be6ce59065631efdc0d8556b5b89e42d1eb
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3609a8a0ba532d5c70bd27c6d33e3600fa52039c254469f7c72b4b003ad84ac7
3
  size 4876059416
model-00007-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30ad23d711a3bab26281398c83802076d340549021872734909fcaacb632f743
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eda2c69a651637e2df148955c69db6c8c907ca8bf30ced192fa7ca806a8b2371
3
  size 4876059416
model-00008-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:695f56dbcb59428a1f5180716cc25446a175a321eb1951dc05f6bdcfb5a7e15d
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fbcbd64c81b04683bb3485e92cc4d628741e4783402d609317dff288ac00184
3
  size 4876059416
model-00009-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70f8b876d5104d74b0bf0a54512ddd205e0129f3462dbb8511bc72d30c75bba9
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3211f631d19fab00c0a1ca04c77c08d73be82acd2e07fe40625c5831154dbed
3
  size 4876059416
model-00010-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1575feae00b83a92cfbae296cb44856025dacfede307d5d5b8983045c2c68a25
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3718145eaf4d7f140bb0d95ac7fbc9d9af6dbe4b72d0402d7ce5561418cbcf14
3
  size 4876059416
model-00011-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54c884bda229860abfe484f81db288e5be47542155d0ebece4e2153d293b64cf
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9970647b254c9104278d2ee5d73eb1e5ed3019ef4eef63eec7460117e950e0a1
3
  size 4876059416
model-00012-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b6132b2b3f25cd804408354591491d6a0efd2de1f21f5828018cb0227ffc397
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f47f0553f0e282ef713dabff5c89ab77e4d49197423e7d8c5707421e92ac5546
3
  size 4876059416
model-00013-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7a6087d76960c15c84dd8b4369c3a783388f3be7e88cb4e0b6cbfb1b11c47a9
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78f9c21b0f9d79b5bd53177f0d000f5841c95ad45cad332d162781c0b4baca8d
3
  size 4876059416
model-00014-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ddfe9614e2167cff3753e94d638ca47198bb5acf809a8efd30f253ecceab9ba
3
  size 2123397800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:276b63bcf000b85448d8a6eb1f9e5e6199a7ca59d63bf5a8d7a38384c25ff059
3
  size 2123397800
trainer_log.jsonl CHANGED
@@ -299,3 +299,58 @@
299
  {"current_steps": 299, "total_steps": 355, "loss": 1.5387, "lr": 1.3319878903820682e-06, "epoch": 0.8403302301071491, "percentage": 84.23, "elapsed_time": "1 day, 9:03:46", "remaining_time": "6:11:32"}
300
  {"current_steps": 300, "total_steps": 355, "loss": 1.54, "lr": 1.2858795279787517e-06, "epoch": 0.843140699104163, "percentage": 84.51, "elapsed_time": "1 day, 9:10:19", "remaining_time": "6:04:53"}
301
  {"current_steps": 301, "total_steps": 355, "loss": 1.5496, "lr": 1.2405284523254823e-06, "epoch": 0.8459511681011769, "percentage": 84.79, "elapsed_time": "1 day, 9:24:48", "remaining_time": "5:59:39"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
299
  {"current_steps": 299, "total_steps": 355, "loss": 1.5387, "lr": 1.3319878903820682e-06, "epoch": 0.8403302301071491, "percentage": 84.23, "elapsed_time": "1 day, 9:03:46", "remaining_time": "6:11:32"}
300
  {"current_steps": 300, "total_steps": 355, "loss": 1.54, "lr": 1.2858795279787517e-06, "epoch": 0.843140699104163, "percentage": 84.51, "elapsed_time": "1 day, 9:10:19", "remaining_time": "6:04:53"}
301
  {"current_steps": 301, "total_steps": 355, "loss": 1.5496, "lr": 1.2405284523254823e-06, "epoch": 0.8459511681011769, "percentage": 84.79, "elapsed_time": "1 day, 9:24:48", "remaining_time": "5:59:39"}
302
+ {"current_steps": 302, "total_steps": 355, "loss": 1.5274, "lr": 1.195938604585205e-06, "epoch": 0.8487616370981907, "percentage": 85.07, "elapsed_time": "1 day, 9:31:30", "remaining_time": "5:53:00"}
303
+ {"current_steps": 303, "total_steps": 355, "loss": 1.5437, "lr": 1.152113859767565e-06, "epoch": 0.8515721060952046, "percentage": 85.35, "elapsed_time": "1 day, 9:38:08", "remaining_time": "5:46:20"}
304
+ {"current_steps": 304, "total_steps": 355, "loss": 1.5395, "lr": 1.109058026392158e-06, "epoch": 0.8543825750922185, "percentage": 85.63, "elapsed_time": "1 day, 9:44:49", "remaining_time": "5:39:41"}
305
+ {"current_steps": 305, "total_steps": 355, "loss": 1.5487, "lr": 1.0667748461575544e-06, "epoch": 0.8571930440892324, "percentage": 85.92, "elapsed_time": "1 day, 9:51:34", "remaining_time": "5:33:02"}
306
+ {"current_steps": 306, "total_steps": 355, "loss": 1.5374, "lr": 1.0252679936161392e-06, "epoch": 0.8600035130862462, "percentage": 86.2, "elapsed_time": "1 day, 9:58:14", "remaining_time": "5:26:23"}
307
+ {"current_steps": 307, "total_steps": 355, "loss": 1.5412, "lr": 9.845410758547724e-07, "epoch": 0.8628139820832601, "percentage": 86.48, "elapsed_time": "1 day, 10:04:52", "remaining_time": "5:19:43"}
308
+ {"current_steps": 308, "total_steps": 355, "loss": 1.5295, "lr": 9.445976321813277e-07, "epoch": 0.865624451080274, "percentage": 86.76, "elapsed_time": "1 day, 10:11:29", "remaining_time": "5:13:03"}
309
+ {"current_steps": 309, "total_steps": 355, "loss": 1.5474, "lr": 9.054411338171099e-07, "epoch": 0.868434920077288, "percentage": 87.04, "elapsed_time": "1 day, 10:18:10", "remaining_time": "5:06:23"}
310
+ {"current_steps": 310, "total_steps": 355, "loss": 1.5425, "lr": 8.670749835951964e-07, "epoch": 0.8712453890743018, "percentage": 87.32, "elapsed_time": "1 day, 10:24:48", "remaining_time": "4:59:43"}
311
+ {"current_steps": 311, "total_steps": 355, "loss": 1.5412, "lr": 8.29502515664723e-07, "epoch": 0.8740558580713157, "percentage": 87.61, "elapsed_time": "1 day, 10:31:31", "remaining_time": "4:53:04"}
312
+ {"current_steps": 312, "total_steps": 355, "loss": 1.5589, "lr": 7.927269952011285e-07, "epoch": 0.8768663270683296, "percentage": 87.89, "elapsed_time": "1 day, 10:38:11", "remaining_time": "4:46:25"}
313
+ {"current_steps": 313, "total_steps": 355, "loss": 1.5504, "lr": 7.567516181223966e-07, "epoch": 0.8796767960653434, "percentage": 88.17, "elapsed_time": "1 day, 10:44:54", "remaining_time": "4:39:45"}
314
+ {"current_steps": 314, "total_steps": 355, "loss": 1.5391, "lr": 7.215795108113343e-07, "epoch": 0.8824872650623573, "percentage": 88.45, "elapsed_time": "1 day, 10:51:32", "remaining_time": "4:33:05"}
315
+ {"current_steps": 315, "total_steps": 355, "loss": 1.5354, "lr": 6.872137298438653e-07, "epoch": 0.8852977340593712, "percentage": 88.73, "elapsed_time": "1 day, 10:58:09", "remaining_time": "4:26:26"}
316
+ {"current_steps": 316, "total_steps": 355, "loss": 1.5449, "lr": 6.536572617234082e-07, "epoch": 0.888108203056385, "percentage": 89.01, "elapsed_time": "1 day, 11:04:47", "remaining_time": "4:19:46"}
317
+ {"current_steps": 317, "total_steps": 355, "loss": 1.5544, "lr": 6.209130226213378e-07, "epoch": 0.8909186720533989, "percentage": 89.3, "elapsed_time": "1 day, 11:11:27", "remaining_time": "4:13:06"}
318
+ {"current_steps": 318, "total_steps": 355, "loss": 1.5425, "lr": 5.889838581235641e-07, "epoch": 0.8937291410504128, "percentage": 89.58, "elapsed_time": "1 day, 11:18:06", "remaining_time": "4:06:26"}
319
+ {"current_steps": 319, "total_steps": 355, "loss": 1.5287, "lr": 5.578725429832344e-07, "epoch": 0.8965396100474267, "percentage": 89.86, "elapsed_time": "1 day, 11:24:43", "remaining_time": "3:59:46"}
320
+ {"current_steps": 320, "total_steps": 355, "loss": 1.5399, "lr": 5.275817808796013e-07, "epoch": 0.8993500790444405, "percentage": 90.14, "elapsed_time": "1 day, 11:31:21", "remaining_time": "3:53:07"}
321
+ {"current_steps": 321, "total_steps": 355, "loss": 1.5373, "lr": 4.981142041830645e-07, "epoch": 0.9021605480414544, "percentage": 90.42, "elapsed_time": "1 day, 11:37:57", "remaining_time": "3:46:27"}
322
+ {"current_steps": 322, "total_steps": 355, "loss": 1.5372, "lr": 4.6947237372640954e-07, "epoch": 0.9049710170384683, "percentage": 90.7, "elapsed_time": "1 day, 11:44:35", "remaining_time": "3:39:47"}
323
+ {"current_steps": 323, "total_steps": 355, "loss": 1.5412, "lr": 4.416587785822568e-07, "epoch": 0.9077814860354821, "percentage": 90.99, "elapsed_time": "1 day, 11:51:18", "remaining_time": "3:33:07"}
324
+ {"current_steps": 324, "total_steps": 355, "loss": 1.541, "lr": 4.1467583584676395e-07, "epoch": 0.910591955032496, "percentage": 91.27, "elapsed_time": "1 day, 11:57:57", "remaining_time": "3:26:28"}
325
+ {"current_steps": 325, "total_steps": 355, "loss": 1.539, "lr": 3.885258904295575e-07, "epoch": 0.9134024240295099, "percentage": 91.55, "elapsed_time": "1 day, 12:04:36", "remaining_time": "3:19:48"}
326
+ {"current_steps": 326, "total_steps": 355, "loss": 1.5313, "lr": 3.6321121484996447e-07, "epoch": 0.9162128930265238, "percentage": 91.83, "elapsed_time": "1 day, 12:11:16", "remaining_time": "3:13:09"}
327
+ {"current_steps": 327, "total_steps": 355, "loss": 1.5396, "lr": 3.3873400903951636e-07, "epoch": 0.9190233620235376, "percentage": 92.11, "elapsed_time": "1 day, 12:17:51", "remaining_time": "3:06:29"}
328
+ {"current_steps": 328, "total_steps": 355, "loss": 1.5471, "lr": 3.1509640015076946e-07, "epoch": 0.9218338310205516, "percentage": 92.39, "elapsed_time": "1 day, 12:24:25", "remaining_time": "2:59:48"}
329
+ {"current_steps": 329, "total_steps": 355, "loss": 1.5302, "lr": 2.923004423724474e-07, "epoch": 0.9246443000175655, "percentage": 92.68, "elapsed_time": "1 day, 12:30:57", "remaining_time": "2:53:08"}
330
+ {"current_steps": 330, "total_steps": 355, "loss": 1.5387, "lr": 2.703481167509281e-07, "epoch": 0.9274547690145793, "percentage": 92.96, "elapsed_time": "1 day, 12:37:35", "remaining_time": "2:46:29"}
331
+ {"current_steps": 331, "total_steps": 355, "loss": 1.5379, "lr": 2.4924133101807636e-07, "epoch": 0.9302652380115932, "percentage": 93.24, "elapsed_time": "1 day, 12:44:11", "remaining_time": "2:39:49"}
332
+ {"current_steps": 332, "total_steps": 355, "loss": 1.54, "lr": 2.289819194254661e-07, "epoch": 0.9330757070086071, "percentage": 93.52, "elapsed_time": "1 day, 12:50:48", "remaining_time": "2:33:09"}
333
+ {"current_steps": 333, "total_steps": 355, "loss": 1.5413, "lr": 2.0957164258497031e-07, "epoch": 0.935886176005621, "percentage": 93.8, "elapsed_time": "1 day, 12:57:19", "remaining_time": "2:26:29"}
334
+ {"current_steps": 334, "total_steps": 355, "loss": 1.5547, "lr": 1.9101218731575777e-07, "epoch": 0.9386966450026348, "percentage": 94.08, "elapsed_time": "1 day, 13:03:50", "remaining_time": "2:19:49"}
335
+ {"current_steps": 335, "total_steps": 355, "loss": 1.5374, "lr": 1.73305166497707e-07, "epoch": 0.9415071139996487, "percentage": 94.37, "elapsed_time": "1 day, 13:10:27", "remaining_time": "2:13:09"}
336
+ {"current_steps": 336, "total_steps": 355, "loss": 1.5449, "lr": 1.5645211893123846e-07, "epoch": 0.9443175829966626, "percentage": 94.65, "elapsed_time": "1 day, 13:17:01", "remaining_time": "2:06:29"}
337
+ {"current_steps": 337, "total_steps": 355, "loss": 1.5418, "lr": 1.4045450920358917e-07, "epoch": 0.9471280519936764, "percentage": 94.93, "elapsed_time": "1 day, 13:23:35", "remaining_time": "1:59:50"}
338
+ {"current_steps": 338, "total_steps": 355, "loss": 1.5451, "lr": 1.2531372756153458e-07, "epoch": 0.9499385209906903, "percentage": 95.21, "elapsed_time": "1 day, 13:30:09", "remaining_time": "1:53:10"}
339
+ {"current_steps": 339, "total_steps": 355, "loss": 1.5329, "lr": 1.1103108979056865e-07, "epoch": 0.9527489899877042, "percentage": 95.49, "elapsed_time": "1 day, 13:36:42", "remaining_time": "1:46:30"}
340
+ {"current_steps": 340, "total_steps": 355, "loss": 1.5399, "lr": 9.760783710056176e-08, "epoch": 0.9555594589847181, "percentage": 95.77, "elapsed_time": "1 day, 13:43:15", "remaining_time": "1:39:50"}
341
+ {"current_steps": 341, "total_steps": 355, "loss": 1.5372, "lr": 8.504513601789388e-08, "epoch": 0.9583699279817319, "percentage": 96.06, "elapsed_time": "1 day, 13:49:47", "remaining_time": "1:33:11"}
342
+ {"current_steps": 342, "total_steps": 355, "loss": 1.5415, "lr": 7.334407828407885e-08, "epoch": 0.9611803969787458, "percentage": 96.34, "elapsed_time": "1 day, 13:56:19", "remaining_time": "1:26:31"}
343
+ {"current_steps": 343, "total_steps": 355, "loss": 1.5388, "lr": 6.250568076088814e-08, "epoch": 0.9639908659757597, "percentage": 96.62, "elapsed_time": "1 day, 14:02:50", "remaining_time": "1:19:51"}
344
+ {"current_steps": 344, "total_steps": 355, "loss": 1.5385, "lr": 5.2530885341982586e-08, "epoch": 0.9668013349727735, "percentage": 96.9, "elapsed_time": "1 day, 14:09:22", "remaining_time": "1:13:12"}
345
+ {"current_steps": 345, "total_steps": 355, "loss": 1.5447, "lr": 4.3420558871060116e-08, "epoch": 0.9696118039697874, "percentage": 97.18, "elapsed_time": "1 day, 14:15:52", "remaining_time": "1:06:32"}
346
+ {"current_steps": 346, "total_steps": 355, "loss": 1.538, "lr": 3.517549306652157e-08, "epoch": 0.9724222729668013, "percentage": 97.46, "elapsed_time": "1 day, 14:22:25", "remaining_time": "0:59:53"}
347
+ {"current_steps": 347, "total_steps": 355, "loss": 1.5506, "lr": 2.7796404452666847e-08, "epoch": 0.9752327419638153, "percentage": 97.75, "elapsed_time": "1 day, 14:28:55", "remaining_time": "0:53:13"}
348
+ {"current_steps": 348, "total_steps": 355, "loss": 1.5365, "lr": 2.1283934297432472e-08, "epoch": 0.9780432109608291, "percentage": 98.03, "elapsed_time": "1 day, 14:35:25", "remaining_time": "0:46:34"}
349
+ {"current_steps": 349, "total_steps": 355, "loss": 1.5406, "lr": 1.5638648556656198e-08, "epoch": 0.980853679957843, "percentage": 98.31, "elapsed_time": "1 day, 14:42:00", "remaining_time": "0:39:55"}
350
+ {"current_steps": 350, "total_steps": 355, "loss": 1.5474, "lr": 1.0861037824896337e-08, "epoch": 0.9836641489548569, "percentage": 98.59, "elapsed_time": "1 day, 14:48:31", "remaining_time": "0:33:15"}
351
+ {"current_steps": 351, "total_steps": 355, "loss": 1.5417, "lr": 6.951517292800303e-09, "epoch": 0.9864746179518707, "percentage": 98.87, "elapsed_time": "1 day, 14:55:01", "remaining_time": "0:26:36"}
352
+ {"current_steps": 352, "total_steps": 355, "loss": 1.5369, "lr": 3.9104267110168235e-09, "epoch": 0.9892850869488846, "percentage": 99.15, "elapsed_time": "1 day, 15:01:33", "remaining_time": "0:19:57"}
353
+ {"current_steps": 353, "total_steps": 355, "loss": 1.5488, "lr": 1.738030360677323e-09, "epoch": 0.9920955559458985, "percentage": 99.44, "elapsed_time": "1 day, 15:08:06", "remaining_time": "0:13:18"}
354
+ {"current_steps": 354, "total_steps": 355, "loss": 1.5375, "lr": 4.3451703042207694e-10, "epoch": 0.9949060249429124, "percentage": 99.72, "elapsed_time": "1 day, 15:14:37", "remaining_time": "0:06:39"}
355
+ {"current_steps": 355, "total_steps": 355, "loss": 1.5352, "lr": 0.0, "epoch": 0.9977164939399262, "percentage": 100.0, "elapsed_time": "1 day, 15:21:11", "remaining_time": "0:00:00"}
356
+ {"current_steps": 355, "total_steps": 355, "epoch": 0.9977164939399262, "percentage": 100.0, "elapsed_time": "1 day, 15:29:13", "remaining_time": "0:00:00"}