diff --git "a/model2/trainer_state.json" "b/model2/trainer_state.json" new file mode 100644--- /dev/null +++ "b/model2/trainer_state.json" @@ -0,0 +1,87290 @@ +{ + "best_global_step": null, + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0001283579352709, + "eval_steps": 500, + "global_step": 109070, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 9.168423947923352e-05, + "learning_rate": 0.00019998349683689374, + "loss": 1.923, + "mean_token_accuracy": 0.5671112179756165, + "num_tokens": 23240.0, + "step": 10 + }, + { + "epoch": 0.00018336847895846704, + "learning_rate": 0.0001999651599889979, + "loss": 1.3823, + "mean_token_accuracy": 0.6590937197208404, + "num_tokens": 46441.0, + "step": 20 + }, + { + "epoch": 0.0002750527184377006, + "learning_rate": 0.00019994682314110205, + "loss": 1.2459, + "mean_token_accuracy": 0.6675321936607361, + "num_tokens": 69296.0, + "step": 30 + }, + { + "epoch": 0.0003667369579169341, + "learning_rate": 0.00019992848629320618, + "loss": 1.1608, + "mean_token_accuracy": 0.6786929786205291, + "num_tokens": 92571.0, + "step": 40 + }, + { + "epoch": 0.0004584211973961676, + "learning_rate": 0.00019991014944531038, + "loss": 1.1545, + "mean_token_accuracy": 0.6873579978942871, + "num_tokens": 115866.0, + "step": 50 + }, + { + "epoch": 0.0005501054368754011, + "learning_rate": 0.00019989181259741452, + "loss": 1.0964, + "mean_token_accuracy": 0.6990690946578979, + "num_tokens": 138611.0, + "step": 60 + }, + { + "epoch": 0.0006417896763546347, + "learning_rate": 0.00019987347574951868, + "loss": 1.081, + "mean_token_accuracy": 0.7047873675823212, + "num_tokens": 162354.0, + "step": 70 + }, + { + "epoch": 0.0007334739158338682, + "learning_rate": 0.00019985513890162282, + "loss": 1.1199, + "mean_token_accuracy": 0.6927294492721557, + "num_tokens": 185436.0, + "step": 80 + }, + { + "epoch": 0.0008251581553131017, + "learning_rate": 0.00019983680205372696, + "loss": 1.0239, + "mean_token_accuracy": 0.7098340153694153, + "num_tokens": 209182.0, + "step": 90 + }, + { + "epoch": 0.0009168423947923352, + "learning_rate": 0.00019981846520583112, + "loss": 1.0153, + "mean_token_accuracy": 0.7134263336658477, + "num_tokens": 232622.0, + "step": 100 + }, + { + "epoch": 0.0010085266342715687, + "learning_rate": 0.0001998001283579353, + "loss": 1.0558, + "mean_token_accuracy": 0.7057909607887268, + "num_tokens": 255986.0, + "step": 110 + }, + { + "epoch": 0.0011002108737508023, + "learning_rate": 0.00019978179151003945, + "loss": 1.0556, + "mean_token_accuracy": 0.7068513870239258, + "num_tokens": 278812.0, + "step": 120 + }, + { + "epoch": 0.0011918951132300357, + "learning_rate": 0.0001997634546621436, + "loss": 1.1141, + "mean_token_accuracy": 0.6901987969875336, + "num_tokens": 301968.0, + "step": 130 + }, + { + "epoch": 0.0012835793527092693, + "learning_rate": 0.00019974511781424773, + "loss": 1.0658, + "mean_token_accuracy": 0.709293419122696, + "num_tokens": 325897.0, + "step": 140 + }, + { + "epoch": 0.0013752635921885027, + "learning_rate": 0.0001997267809663519, + "loss": 1.0533, + "mean_token_accuracy": 0.7050972282886505, + "num_tokens": 348899.0, + "step": 150 + }, + { + "epoch": 0.0014669478316677363, + "learning_rate": 0.00019970844411845603, + "loss": 1.0351, + "mean_token_accuracy": 0.7042410492897033, + "num_tokens": 372353.0, + "step": 160 + }, + { + "epoch": 0.00155863207114697, + "learning_rate": 0.0001996901072705602, + "loss": 1.0595, + "mean_token_accuracy": 0.7090585947036743, + "num_tokens": 395742.0, + "step": 170 + }, + { + "epoch": 0.0016503163106262033, + "learning_rate": 0.00019967177042266436, + "loss": 1.0508, + "mean_token_accuracy": 0.7078003644943237, + "num_tokens": 418213.0, + "step": 180 + }, + { + "epoch": 0.001742000550105437, + "learning_rate": 0.0001996534335747685, + "loss": 1.0229, + "mean_token_accuracy": 0.7085508227348327, + "num_tokens": 441971.0, + "step": 190 + }, + { + "epoch": 0.0018336847895846704, + "learning_rate": 0.00019963509672687267, + "loss": 1.0318, + "mean_token_accuracy": 0.7104375839233399, + "num_tokens": 465422.0, + "step": 200 + }, + { + "epoch": 0.001925369029063904, + "learning_rate": 0.0001996167598789768, + "loss": 1.0309, + "mean_token_accuracy": 0.714245331287384, + "num_tokens": 487928.0, + "step": 210 + }, + { + "epoch": 0.0020170532685431374, + "learning_rate": 0.00019959842303108097, + "loss": 1.0399, + "mean_token_accuracy": 0.7037406146526337, + "num_tokens": 512219.0, + "step": 220 + }, + { + "epoch": 0.002108737508022371, + "learning_rate": 0.0001995800861831851, + "loss": 1.0346, + "mean_token_accuracy": 0.7041298568248748, + "num_tokens": 535130.0, + "step": 230 + }, + { + "epoch": 0.0022004217475016046, + "learning_rate": 0.00019956174933528928, + "loss": 1.0245, + "mean_token_accuracy": 0.7015379905700684, + "num_tokens": 558131.0, + "step": 240 + }, + { + "epoch": 0.0022921059869808378, + "learning_rate": 0.00019954341248739344, + "loss": 1.0207, + "mean_token_accuracy": 0.7124298512935638, + "num_tokens": 580761.0, + "step": 250 + }, + { + "epoch": 0.0023837902264600714, + "learning_rate": 0.00019952507563949758, + "loss": 1.0441, + "mean_token_accuracy": 0.7096422195434571, + "num_tokens": 604278.0, + "step": 260 + }, + { + "epoch": 0.002475474465939305, + "learning_rate": 0.00019950673879160174, + "loss": 1.047, + "mean_token_accuracy": 0.7109373688697815, + "num_tokens": 627516.0, + "step": 270 + }, + { + "epoch": 0.0025671587054185386, + "learning_rate": 0.00019948840194370588, + "loss": 0.9743, + "mean_token_accuracy": 0.7240226328372955, + "num_tokens": 651591.0, + "step": 280 + }, + { + "epoch": 0.0026588429448977722, + "learning_rate": 0.00019947006509581002, + "loss": 1.0425, + "mean_token_accuracy": 0.7046778917312622, + "num_tokens": 674320.0, + "step": 290 + }, + { + "epoch": 0.0027505271843770054, + "learning_rate": 0.0001994517282479142, + "loss": 0.9836, + "mean_token_accuracy": 0.7111404120922089, + "num_tokens": 697451.0, + "step": 300 + }, + { + "epoch": 0.002842211423856239, + "learning_rate": 0.00019943339140001835, + "loss": 1.0388, + "mean_token_accuracy": 0.708145147562027, + "num_tokens": 721193.0, + "step": 310 + }, + { + "epoch": 0.0029338956633354727, + "learning_rate": 0.00019941505455212252, + "loss": 1.0164, + "mean_token_accuracy": 0.7146294176578522, + "num_tokens": 744067.0, + "step": 320 + }, + { + "epoch": 0.0030255799028147063, + "learning_rate": 0.00019939671770422666, + "loss": 1.032, + "mean_token_accuracy": 0.7135140478610993, + "num_tokens": 767476.0, + "step": 330 + }, + { + "epoch": 0.00311726414229394, + "learning_rate": 0.0001993783808563308, + "loss": 1.0081, + "mean_token_accuracy": 0.7130200088024139, + "num_tokens": 790545.0, + "step": 340 + }, + { + "epoch": 0.003208948381773173, + "learning_rate": 0.00019936004400843496, + "loss": 0.9808, + "mean_token_accuracy": 0.721145749092102, + "num_tokens": 813522.0, + "step": 350 + }, + { + "epoch": 0.0033006326212524067, + "learning_rate": 0.0001993417071605391, + "loss": 0.9681, + "mean_token_accuracy": 0.7215366899967194, + "num_tokens": 836771.0, + "step": 360 + }, + { + "epoch": 0.0033923168607316403, + "learning_rate": 0.00019932337031264326, + "loss": 1.0226, + "mean_token_accuracy": 0.7119088530540466, + "num_tokens": 859901.0, + "step": 370 + }, + { + "epoch": 0.003484001100210874, + "learning_rate": 0.00019930503346474743, + "loss": 0.9835, + "mean_token_accuracy": 0.7127217948436737, + "num_tokens": 883177.0, + "step": 380 + }, + { + "epoch": 0.003575685339690107, + "learning_rate": 0.00019928669661685157, + "loss": 0.999, + "mean_token_accuracy": 0.7090746223926544, + "num_tokens": 907431.0, + "step": 390 + }, + { + "epoch": 0.0036673695791693407, + "learning_rate": 0.00019926835976895573, + "loss": 1.0289, + "mean_token_accuracy": 0.7040601015090943, + "num_tokens": 930277.0, + "step": 400 + }, + { + "epoch": 0.0037590538186485743, + "learning_rate": 0.00019925002292105987, + "loss": 1.0032, + "mean_token_accuracy": 0.7104796707630158, + "num_tokens": 952904.0, + "step": 410 + }, + { + "epoch": 0.003850738058127808, + "learning_rate": 0.00019923168607316404, + "loss": 1.028, + "mean_token_accuracy": 0.7142015218734741, + "num_tokens": 976112.0, + "step": 420 + }, + { + "epoch": 0.0039424222976070416, + "learning_rate": 0.00019921334922526817, + "loss": 1.0175, + "mean_token_accuracy": 0.7111793398857117, + "num_tokens": 1000129.0, + "step": 430 + }, + { + "epoch": 0.004034106537086275, + "learning_rate": 0.00019919501237737234, + "loss": 1.0108, + "mean_token_accuracy": 0.7194611966609955, + "num_tokens": 1024034.0, + "step": 440 + }, + { + "epoch": 0.004125790776565509, + "learning_rate": 0.0001991766755294765, + "loss": 1.001, + "mean_token_accuracy": 0.7095412254333496, + "num_tokens": 1047274.0, + "step": 450 + }, + { + "epoch": 0.004217475016044742, + "learning_rate": 0.00019915833868158064, + "loss": 1.0316, + "mean_token_accuracy": 0.7048232853412628, + "num_tokens": 1070814.0, + "step": 460 + }, + { + "epoch": 0.004309159255523975, + "learning_rate": 0.0001991400018336848, + "loss": 1.0021, + "mean_token_accuracy": 0.7127786338329315, + "num_tokens": 1093506.0, + "step": 470 + }, + { + "epoch": 0.004400843495003209, + "learning_rate": 0.00019912166498578895, + "loss": 1.0864, + "mean_token_accuracy": 0.6990128040313721, + "num_tokens": 1116273.0, + "step": 480 + }, + { + "epoch": 0.004492527734482442, + "learning_rate": 0.00019910332813789309, + "loss": 0.9868, + "mean_token_accuracy": 0.7214479863643646, + "num_tokens": 1139494.0, + "step": 490 + }, + { + "epoch": 0.0045842119739616756, + "learning_rate": 0.00019908499128999728, + "loss": 1.0224, + "mean_token_accuracy": 0.7078819572925568, + "num_tokens": 1162185.0, + "step": 500 + }, + { + "epoch": 0.00467589621344091, + "learning_rate": 0.00019906665444210142, + "loss": 0.9564, + "mean_token_accuracy": 0.7251663327217102, + "num_tokens": 1185649.0, + "step": 510 + }, + { + "epoch": 0.004767580452920143, + "learning_rate": 0.00019904831759420558, + "loss": 1.0394, + "mean_token_accuracy": 0.7065913915634155, + "num_tokens": 1208749.0, + "step": 520 + }, + { + "epoch": 0.004859264692399377, + "learning_rate": 0.00019902998074630972, + "loss": 0.9923, + "mean_token_accuracy": 0.7146309971809387, + "num_tokens": 1232124.0, + "step": 530 + }, + { + "epoch": 0.00495094893187861, + "learning_rate": 0.00019901164389841386, + "loss": 1.0036, + "mean_token_accuracy": 0.717809009552002, + "num_tokens": 1255100.0, + "step": 540 + }, + { + "epoch": 0.005042633171357843, + "learning_rate": 0.00019899330705051802, + "loss": 1.0539, + "mean_token_accuracy": 0.7106794893741608, + "num_tokens": 1278052.0, + "step": 550 + }, + { + "epoch": 0.005134317410837077, + "learning_rate": 0.00019897497020262216, + "loss": 1.0064, + "mean_token_accuracy": 0.7144601583480835, + "num_tokens": 1301376.0, + "step": 560 + }, + { + "epoch": 0.0052260016503163104, + "learning_rate": 0.00019895663335472633, + "loss": 1.0455, + "mean_token_accuracy": 0.7059086263179779, + "num_tokens": 1324700.0, + "step": 570 + }, + { + "epoch": 0.0053176858897955445, + "learning_rate": 0.0001989382965068305, + "loss": 0.9906, + "mean_token_accuracy": 0.7112154304981232, + "num_tokens": 1347260.0, + "step": 580 + }, + { + "epoch": 0.005409370129274778, + "learning_rate": 0.00019891995965893463, + "loss": 0.9914, + "mean_token_accuracy": 0.7184651911258697, + "num_tokens": 1370130.0, + "step": 590 + }, + { + "epoch": 0.005501054368754011, + "learning_rate": 0.0001989016228110388, + "loss": 0.977, + "mean_token_accuracy": 0.7227175831794739, + "num_tokens": 1393754.0, + "step": 600 + }, + { + "epoch": 0.005592738608233245, + "learning_rate": 0.00019888328596314294, + "loss": 0.9863, + "mean_token_accuracy": 0.7218797028064727, + "num_tokens": 1417095.0, + "step": 610 + }, + { + "epoch": 0.005684422847712478, + "learning_rate": 0.0001988649491152471, + "loss": 1.0015, + "mean_token_accuracy": 0.7211240470409394, + "num_tokens": 1440173.0, + "step": 620 + }, + { + "epoch": 0.005776107087191712, + "learning_rate": 0.00019884661226735127, + "loss": 0.9524, + "mean_token_accuracy": 0.7226812183856964, + "num_tokens": 1462615.0, + "step": 630 + }, + { + "epoch": 0.005867791326670945, + "learning_rate": 0.0001988282754194554, + "loss": 0.9427, + "mean_token_accuracy": 0.7317568361759186, + "num_tokens": 1485642.0, + "step": 640 + }, + { + "epoch": 0.0059594755661501785, + "learning_rate": 0.00019880993857155957, + "loss": 0.9702, + "mean_token_accuracy": 0.7181661605834961, + "num_tokens": 1508865.0, + "step": 650 + }, + { + "epoch": 0.0060511598056294125, + "learning_rate": 0.0001987916017236637, + "loss": 0.9822, + "mean_token_accuracy": 0.7227430582046509, + "num_tokens": 1531240.0, + "step": 660 + }, + { + "epoch": 0.006142844045108646, + "learning_rate": 0.00019877326487576787, + "loss": 0.9823, + "mean_token_accuracy": 0.7115278661251068, + "num_tokens": 1554582.0, + "step": 670 + }, + { + "epoch": 0.00623452828458788, + "learning_rate": 0.000198754928027872, + "loss": 1.0114, + "mean_token_accuracy": 0.71690434217453, + "num_tokens": 1577156.0, + "step": 680 + }, + { + "epoch": 0.006326212524067113, + "learning_rate": 0.00019873659117997615, + "loss": 0.9203, + "mean_token_accuracy": 0.7258795380592347, + "num_tokens": 1600592.0, + "step": 690 + }, + { + "epoch": 0.006417896763546346, + "learning_rate": 0.00019871825433208034, + "loss": 0.9611, + "mean_token_accuracy": 0.7181583404541015, + "num_tokens": 1622497.0, + "step": 700 + }, + { + "epoch": 0.00650958100302558, + "learning_rate": 0.00019869991748418448, + "loss": 0.995, + "mean_token_accuracy": 0.7175450980663299, + "num_tokens": 1645055.0, + "step": 710 + }, + { + "epoch": 0.006601265242504813, + "learning_rate": 0.00019868158063628865, + "loss": 0.9704, + "mean_token_accuracy": 0.7163600087165832, + "num_tokens": 1668230.0, + "step": 720 + }, + { + "epoch": 0.0066929494819840465, + "learning_rate": 0.00019866324378839279, + "loss": 0.9659, + "mean_token_accuracy": 0.719957035779953, + "num_tokens": 1690963.0, + "step": 730 + }, + { + "epoch": 0.006784633721463281, + "learning_rate": 0.00019864490694049692, + "loss": 0.9757, + "mean_token_accuracy": 0.7256332635879517, + "num_tokens": 1714141.0, + "step": 740 + }, + { + "epoch": 0.006876317960942514, + "learning_rate": 0.0001986265700926011, + "loss": 0.9343, + "mean_token_accuracy": 0.7251800775527955, + "num_tokens": 1737597.0, + "step": 750 + }, + { + "epoch": 0.006968002200421748, + "learning_rate": 0.00019860823324470525, + "loss": 0.9828, + "mean_token_accuracy": 0.7137405216693878, + "num_tokens": 1760673.0, + "step": 760 + }, + { + "epoch": 0.007059686439900981, + "learning_rate": 0.0001985898963968094, + "loss": 1.0008, + "mean_token_accuracy": 0.716589343547821, + "num_tokens": 1783485.0, + "step": 770 + }, + { + "epoch": 0.007151370679380214, + "learning_rate": 0.00019857155954891356, + "loss": 0.9541, + "mean_token_accuracy": 0.727026391029358, + "num_tokens": 1806277.0, + "step": 780 + }, + { + "epoch": 0.007243054918859448, + "learning_rate": 0.0001985532227010177, + "loss": 0.9587, + "mean_token_accuracy": 0.7290895402431488, + "num_tokens": 1829597.0, + "step": 790 + }, + { + "epoch": 0.007334739158338681, + "learning_rate": 0.00019853488585312186, + "loss": 0.9833, + "mean_token_accuracy": 0.7171423137187958, + "num_tokens": 1852391.0, + "step": 800 + }, + { + "epoch": 0.0074264233978179155, + "learning_rate": 0.000198516549005226, + "loss": 0.968, + "mean_token_accuracy": 0.7270346641540527, + "num_tokens": 1875683.0, + "step": 810 + }, + { + "epoch": 0.007518107637297149, + "learning_rate": 0.00019849821215733017, + "loss": 1.0124, + "mean_token_accuracy": 0.7099732458591461, + "num_tokens": 1899044.0, + "step": 820 + }, + { + "epoch": 0.007609791876776382, + "learning_rate": 0.00019847987530943433, + "loss": 0.9879, + "mean_token_accuracy": 0.7223415613174439, + "num_tokens": 1922578.0, + "step": 830 + }, + { + "epoch": 0.007701476116255616, + "learning_rate": 0.00019846153846153847, + "loss": 1.0117, + "mean_token_accuracy": 0.710689491033554, + "num_tokens": 1945702.0, + "step": 840 + }, + { + "epoch": 0.007793160355734849, + "learning_rate": 0.00019844320161364263, + "loss": 1.0074, + "mean_token_accuracy": 0.7130803108215332, + "num_tokens": 1968971.0, + "step": 850 + }, + { + "epoch": 0.007884844595214083, + "learning_rate": 0.00019842486476574677, + "loss": 0.9564, + "mean_token_accuracy": 0.7260822772979736, + "num_tokens": 1992042.0, + "step": 860 + }, + { + "epoch": 0.007976528834693316, + "learning_rate": 0.00019840652791785094, + "loss": 0.9605, + "mean_token_accuracy": 0.7239135682582856, + "num_tokens": 2014709.0, + "step": 870 + }, + { + "epoch": 0.00806821307417255, + "learning_rate": 0.00019838819106995508, + "loss": 0.9672, + "mean_token_accuracy": 0.7277372121810913, + "num_tokens": 2037689.0, + "step": 880 + }, + { + "epoch": 0.008159897313651783, + "learning_rate": 0.00019836985422205924, + "loss": 0.9373, + "mean_token_accuracy": 0.724119883775711, + "num_tokens": 2060452.0, + "step": 890 + }, + { + "epoch": 0.008251581553131018, + "learning_rate": 0.0001983515173741634, + "loss": 0.9671, + "mean_token_accuracy": 0.7217941105365753, + "num_tokens": 2083439.0, + "step": 900 + }, + { + "epoch": 0.00834326579261025, + "learning_rate": 0.00019833318052626755, + "loss": 0.9593, + "mean_token_accuracy": 0.726180350780487, + "num_tokens": 2106422.0, + "step": 910 + }, + { + "epoch": 0.008434950032089484, + "learning_rate": 0.0001983148436783717, + "loss": 0.9969, + "mean_token_accuracy": 0.7121199488639831, + "num_tokens": 2129419.0, + "step": 920 + }, + { + "epoch": 0.008526634271568717, + "learning_rate": 0.00019829650683047585, + "loss": 0.988, + "mean_token_accuracy": 0.7151882767677307, + "num_tokens": 2153284.0, + "step": 930 + }, + { + "epoch": 0.00861831851104795, + "learning_rate": 0.00019827816998258, + "loss": 0.9936, + "mean_token_accuracy": 0.7165880739688874, + "num_tokens": 2177157.0, + "step": 940 + }, + { + "epoch": 0.008710002750527185, + "learning_rate": 0.00019825983313468415, + "loss": 0.9236, + "mean_token_accuracy": 0.7331863820552826, + "num_tokens": 2199698.0, + "step": 950 + }, + { + "epoch": 0.008801686990006418, + "learning_rate": 0.00019824149628678832, + "loss": 0.9382, + "mean_token_accuracy": 0.7276931762695312, + "num_tokens": 2222343.0, + "step": 960 + }, + { + "epoch": 0.008893371229485652, + "learning_rate": 0.00019822315943889246, + "loss": 1.0353, + "mean_token_accuracy": 0.706400340795517, + "num_tokens": 2245100.0, + "step": 970 + }, + { + "epoch": 0.008985055468964885, + "learning_rate": 0.00019820482259099662, + "loss": 0.943, + "mean_token_accuracy": 0.7241316556930542, + "num_tokens": 2267882.0, + "step": 980 + }, + { + "epoch": 0.009076739708444118, + "learning_rate": 0.00019818648574310076, + "loss": 0.9818, + "mean_token_accuracy": 0.715369588136673, + "num_tokens": 2290572.0, + "step": 990 + }, + { + "epoch": 0.009168423947923351, + "learning_rate": 0.00019816814889520493, + "loss": 0.9465, + "mean_token_accuracy": 0.7224092602729797, + "num_tokens": 2312974.0, + "step": 1000 + }, + { + "epoch": 0.009260108187402586, + "learning_rate": 0.00019814981204730906, + "loss": 0.9275, + "mean_token_accuracy": 0.7284131586551666, + "num_tokens": 2336739.0, + "step": 1010 + }, + { + "epoch": 0.00935179242688182, + "learning_rate": 0.00019813147519941323, + "loss": 0.9704, + "mean_token_accuracy": 0.7230646967887878, + "num_tokens": 2360652.0, + "step": 1020 + }, + { + "epoch": 0.009443476666361052, + "learning_rate": 0.0001981131383515174, + "loss": 0.9735, + "mean_token_accuracy": 0.713595587015152, + "num_tokens": 2383611.0, + "step": 1030 + }, + { + "epoch": 0.009535160905840286, + "learning_rate": 0.00019809480150362153, + "loss": 0.9426, + "mean_token_accuracy": 0.7269194841384887, + "num_tokens": 2406931.0, + "step": 1040 + }, + { + "epoch": 0.009626845145319519, + "learning_rate": 0.0001980764646557257, + "loss": 0.9544, + "mean_token_accuracy": 0.7190650165081024, + "num_tokens": 2430341.0, + "step": 1050 + }, + { + "epoch": 0.009718529384798754, + "learning_rate": 0.00019805812780782984, + "loss": 0.9765, + "mean_token_accuracy": 0.7188243806362152, + "num_tokens": 2453112.0, + "step": 1060 + }, + { + "epoch": 0.009810213624277987, + "learning_rate": 0.000198039790959934, + "loss": 0.9685, + "mean_token_accuracy": 0.7198343932628631, + "num_tokens": 2476467.0, + "step": 1070 + }, + { + "epoch": 0.00990189786375722, + "learning_rate": 0.00019802145411203814, + "loss": 0.9433, + "mean_token_accuracy": 0.7255321025848389, + "num_tokens": 2499409.0, + "step": 1080 + }, + { + "epoch": 0.009993582103236453, + "learning_rate": 0.0001980031172641423, + "loss": 0.9668, + "mean_token_accuracy": 0.7166699886322021, + "num_tokens": 2522250.0, + "step": 1090 + }, + { + "epoch": 0.010085266342715686, + "learning_rate": 0.00019798478041624647, + "loss": 0.9958, + "mean_token_accuracy": 0.7167232811450959, + "num_tokens": 2545370.0, + "step": 1100 + }, + { + "epoch": 0.010176950582194921, + "learning_rate": 0.0001979664435683506, + "loss": 0.9621, + "mean_token_accuracy": 0.7260641932487488, + "num_tokens": 2568971.0, + "step": 1110 + }, + { + "epoch": 0.010268634821674155, + "learning_rate": 0.00019794810672045478, + "loss": 0.9318, + "mean_token_accuracy": 0.7268799662590026, + "num_tokens": 2591958.0, + "step": 1120 + }, + { + "epoch": 0.010360319061153388, + "learning_rate": 0.00019792976987255891, + "loss": 0.9242, + "mean_token_accuracy": 0.7272241413593292, + "num_tokens": 2615239.0, + "step": 1130 + }, + { + "epoch": 0.010452003300632621, + "learning_rate": 0.00019791143302466305, + "loss": 0.9699, + "mean_token_accuracy": 0.7197751224040985, + "num_tokens": 2638063.0, + "step": 1140 + }, + { + "epoch": 0.010543687540111854, + "learning_rate": 0.00019789309617676724, + "loss": 0.9832, + "mean_token_accuracy": 0.7191377222537995, + "num_tokens": 2660601.0, + "step": 1150 + }, + { + "epoch": 0.010635371779591089, + "learning_rate": 0.00019787475932887138, + "loss": 0.9897, + "mean_token_accuracy": 0.7226161777973175, + "num_tokens": 2682907.0, + "step": 1160 + }, + { + "epoch": 0.010727056019070322, + "learning_rate": 0.00019785642248097552, + "loss": 1.0066, + "mean_token_accuracy": 0.7087887823581696, + "num_tokens": 2706737.0, + "step": 1170 + }, + { + "epoch": 0.010818740258549555, + "learning_rate": 0.0001978380856330797, + "loss": 0.9805, + "mean_token_accuracy": 0.7189956307411194, + "num_tokens": 2729568.0, + "step": 1180 + }, + { + "epoch": 0.010910424498028789, + "learning_rate": 0.00019781974878518383, + "loss": 0.9767, + "mean_token_accuracy": 0.7154843866825104, + "num_tokens": 2753432.0, + "step": 1190 + }, + { + "epoch": 0.011002108737508022, + "learning_rate": 0.000197801411937288, + "loss": 0.9598, + "mean_token_accuracy": 0.7268693804740906, + "num_tokens": 2775300.0, + "step": 1200 + }, + { + "epoch": 0.011093792976987257, + "learning_rate": 0.00019778307508939213, + "loss": 0.9813, + "mean_token_accuracy": 0.7163785696029663, + "num_tokens": 2798396.0, + "step": 1210 + }, + { + "epoch": 0.01118547721646649, + "learning_rate": 0.0001977647382414963, + "loss": 0.9622, + "mean_token_accuracy": 0.7209876716136933, + "num_tokens": 2820421.0, + "step": 1220 + }, + { + "epoch": 0.011277161455945723, + "learning_rate": 0.00019774640139360046, + "loss": 0.9366, + "mean_token_accuracy": 0.7272763848304749, + "num_tokens": 2842838.0, + "step": 1230 + }, + { + "epoch": 0.011368845695424956, + "learning_rate": 0.0001977280645457046, + "loss": 0.9896, + "mean_token_accuracy": 0.7131923735141754, + "num_tokens": 2865965.0, + "step": 1240 + }, + { + "epoch": 0.01146052993490419, + "learning_rate": 0.00019770972769780876, + "loss": 0.9337, + "mean_token_accuracy": 0.7314384281635284, + "num_tokens": 2888744.0, + "step": 1250 + }, + { + "epoch": 0.011552214174383424, + "learning_rate": 0.0001976913908499129, + "loss": 0.9389, + "mean_token_accuracy": 0.7257712483406067, + "num_tokens": 2911838.0, + "step": 1260 + }, + { + "epoch": 0.011643898413862657, + "learning_rate": 0.00019767305400201707, + "loss": 0.9817, + "mean_token_accuracy": 0.7177240908145904, + "num_tokens": 2934685.0, + "step": 1270 + }, + { + "epoch": 0.01173558265334189, + "learning_rate": 0.0001976547171541212, + "loss": 0.9847, + "mean_token_accuracy": 0.7176860392093658, + "num_tokens": 2957712.0, + "step": 1280 + }, + { + "epoch": 0.011827266892821124, + "learning_rate": 0.00019763638030622537, + "loss": 0.9527, + "mean_token_accuracy": 0.7200366497039795, + "num_tokens": 2981205.0, + "step": 1290 + }, + { + "epoch": 0.011918951132300357, + "learning_rate": 0.00019761804345832954, + "loss": 0.9404, + "mean_token_accuracy": 0.7285177111625671, + "num_tokens": 3005064.0, + "step": 1300 + }, + { + "epoch": 0.012010635371779592, + "learning_rate": 0.00019759970661043367, + "loss": 0.9749, + "mean_token_accuracy": 0.7237740933895112, + "num_tokens": 3028358.0, + "step": 1310 + }, + { + "epoch": 0.012102319611258825, + "learning_rate": 0.00019758136976253784, + "loss": 0.9407, + "mean_token_accuracy": 0.7212411761283875, + "num_tokens": 3051640.0, + "step": 1320 + }, + { + "epoch": 0.012194003850738058, + "learning_rate": 0.00019756303291464198, + "loss": 0.9969, + "mean_token_accuracy": 0.7143770158290863, + "num_tokens": 3074093.0, + "step": 1330 + }, + { + "epoch": 0.012285688090217291, + "learning_rate": 0.00019754469606674612, + "loss": 0.9663, + "mean_token_accuracy": 0.721057939529419, + "num_tokens": 3097195.0, + "step": 1340 + }, + { + "epoch": 0.012377372329696525, + "learning_rate": 0.0001975263592188503, + "loss": 0.9828, + "mean_token_accuracy": 0.7231638550758361, + "num_tokens": 3120301.0, + "step": 1350 + }, + { + "epoch": 0.01246905656917576, + "learning_rate": 0.00019750802237095445, + "loss": 1.0089, + "mean_token_accuracy": 0.7083804249763489, + "num_tokens": 3143453.0, + "step": 1360 + }, + { + "epoch": 0.012560740808654993, + "learning_rate": 0.00019748968552305859, + "loss": 0.9372, + "mean_token_accuracy": 0.7232567846775055, + "num_tokens": 3166434.0, + "step": 1370 + }, + { + "epoch": 0.012652425048134226, + "learning_rate": 0.00019747134867516275, + "loss": 0.9585, + "mean_token_accuracy": 0.7252507746219635, + "num_tokens": 3189720.0, + "step": 1380 + }, + { + "epoch": 0.012744109287613459, + "learning_rate": 0.0001974530118272669, + "loss": 0.9243, + "mean_token_accuracy": 0.7273086667060852, + "num_tokens": 3213296.0, + "step": 1390 + }, + { + "epoch": 0.012835793527092692, + "learning_rate": 0.00019743467497937106, + "loss": 1.0068, + "mean_token_accuracy": 0.7107485592365265, + "num_tokens": 3236429.0, + "step": 1400 + }, + { + "epoch": 0.012927477766571925, + "learning_rate": 0.0001974163381314752, + "loss": 1.0114, + "mean_token_accuracy": 0.7163017809391021, + "num_tokens": 3259605.0, + "step": 1410 + }, + { + "epoch": 0.01301916200605116, + "learning_rate": 0.00019739800128357936, + "loss": 0.9551, + "mean_token_accuracy": 0.7215744376182556, + "num_tokens": 3282382.0, + "step": 1420 + }, + { + "epoch": 0.013110846245530394, + "learning_rate": 0.00019737966443568352, + "loss": 0.9525, + "mean_token_accuracy": 0.7207176864147187, + "num_tokens": 3305393.0, + "step": 1430 + }, + { + "epoch": 0.013202530485009627, + "learning_rate": 0.00019736132758778766, + "loss": 0.9652, + "mean_token_accuracy": 0.7264041602611542, + "num_tokens": 3328431.0, + "step": 1440 + }, + { + "epoch": 0.01329421472448886, + "learning_rate": 0.00019734299073989183, + "loss": 0.9875, + "mean_token_accuracy": 0.7188103854656219, + "num_tokens": 3351574.0, + "step": 1450 + }, + { + "epoch": 0.013385898963968093, + "learning_rate": 0.00019732465389199597, + "loss": 0.9556, + "mean_token_accuracy": 0.7261079728603363, + "num_tokens": 3375174.0, + "step": 1460 + }, + { + "epoch": 0.013477583203447328, + "learning_rate": 0.00019730631704410013, + "loss": 0.9486, + "mean_token_accuracy": 0.7252309262752533, + "num_tokens": 3399179.0, + "step": 1470 + }, + { + "epoch": 0.013569267442926561, + "learning_rate": 0.0001972879801962043, + "loss": 0.9087, + "mean_token_accuracy": 0.7351897895336151, + "num_tokens": 3423090.0, + "step": 1480 + }, + { + "epoch": 0.013660951682405794, + "learning_rate": 0.00019726964334830844, + "loss": 0.9608, + "mean_token_accuracy": 0.7285245358943939, + "num_tokens": 3446736.0, + "step": 1490 + }, + { + "epoch": 0.013752635921885028, + "learning_rate": 0.0001972513065004126, + "loss": 0.9423, + "mean_token_accuracy": 0.7259980082511902, + "num_tokens": 3470538.0, + "step": 1500 + }, + { + "epoch": 0.01384432016136426, + "learning_rate": 0.00019723296965251674, + "loss": 0.9585, + "mean_token_accuracy": 0.7208814442157745, + "num_tokens": 3493164.0, + "step": 1510 + }, + { + "epoch": 0.013936004400843496, + "learning_rate": 0.0001972146328046209, + "loss": 0.9534, + "mean_token_accuracy": 0.7244306862354278, + "num_tokens": 3515939.0, + "step": 1520 + }, + { + "epoch": 0.014027688640322729, + "learning_rate": 0.00019719629595672504, + "loss": 0.9566, + "mean_token_accuracy": 0.7232561886310578, + "num_tokens": 3539096.0, + "step": 1530 + }, + { + "epoch": 0.014119372879801962, + "learning_rate": 0.00019717795910882918, + "loss": 0.941, + "mean_token_accuracy": 0.7308221578598022, + "num_tokens": 3562532.0, + "step": 1540 + }, + { + "epoch": 0.014211057119281195, + "learning_rate": 0.00019715962226093337, + "loss": 0.9695, + "mean_token_accuracy": 0.7229514122009277, + "num_tokens": 3585952.0, + "step": 1550 + }, + { + "epoch": 0.014302741358760428, + "learning_rate": 0.0001971412854130375, + "loss": 0.9583, + "mean_token_accuracy": 0.7235263407230377, + "num_tokens": 3608803.0, + "step": 1560 + }, + { + "epoch": 0.014394425598239663, + "learning_rate": 0.00019712294856514165, + "loss": 0.9381, + "mean_token_accuracy": 0.7337869882583619, + "num_tokens": 3631898.0, + "step": 1570 + }, + { + "epoch": 0.014486109837718896, + "learning_rate": 0.00019710461171724582, + "loss": 0.9422, + "mean_token_accuracy": 0.7355702638626098, + "num_tokens": 3654752.0, + "step": 1580 + }, + { + "epoch": 0.01457779407719813, + "learning_rate": 0.00019708627486934995, + "loss": 0.9378, + "mean_token_accuracy": 0.7221675395965577, + "num_tokens": 3678326.0, + "step": 1590 + }, + { + "epoch": 0.014669478316677363, + "learning_rate": 0.00019706793802145412, + "loss": 0.9546, + "mean_token_accuracy": 0.7216339230537414, + "num_tokens": 3701736.0, + "step": 1600 + }, + { + "epoch": 0.014761162556156596, + "learning_rate": 0.00019704960117355828, + "loss": 0.9792, + "mean_token_accuracy": 0.7194464564323425, + "num_tokens": 3724626.0, + "step": 1610 + }, + { + "epoch": 0.014852846795635831, + "learning_rate": 0.00019703126432566242, + "loss": 0.9423, + "mean_token_accuracy": 0.7257243514060974, + "num_tokens": 3747992.0, + "step": 1620 + }, + { + "epoch": 0.014944531035115064, + "learning_rate": 0.0001970129274777666, + "loss": 0.9693, + "mean_token_accuracy": 0.7192770183086395, + "num_tokens": 3770426.0, + "step": 1630 + }, + { + "epoch": 0.015036215274594297, + "learning_rate": 0.00019699459062987073, + "loss": 0.9852, + "mean_token_accuracy": 0.7204219222068786, + "num_tokens": 3793564.0, + "step": 1640 + }, + { + "epoch": 0.01512789951407353, + "learning_rate": 0.0001969762537819749, + "loss": 0.9204, + "mean_token_accuracy": 0.7410035967826843, + "num_tokens": 3815840.0, + "step": 1650 + }, + { + "epoch": 0.015219583753552764, + "learning_rate": 0.00019695791693407903, + "loss": 0.9559, + "mean_token_accuracy": 0.7224495232105255, + "num_tokens": 3838591.0, + "step": 1660 + }, + { + "epoch": 0.015311267993031999, + "learning_rate": 0.0001969395800861832, + "loss": 0.8758, + "mean_token_accuracy": 0.7431340098381043, + "num_tokens": 3861813.0, + "step": 1670 + }, + { + "epoch": 0.015402952232511232, + "learning_rate": 0.00019692124323828736, + "loss": 0.9994, + "mean_token_accuracy": 0.7104192674160004, + "num_tokens": 3885929.0, + "step": 1680 + }, + { + "epoch": 0.015494636471990465, + "learning_rate": 0.0001969029063903915, + "loss": 0.9614, + "mean_token_accuracy": 0.7201364398002624, + "num_tokens": 3908600.0, + "step": 1690 + }, + { + "epoch": 0.015586320711469698, + "learning_rate": 0.00019688456954249567, + "loss": 0.9499, + "mean_token_accuracy": 0.7221241772174836, + "num_tokens": 3931576.0, + "step": 1700 + }, + { + "epoch": 0.015678004950948933, + "learning_rate": 0.0001968662326945998, + "loss": 0.9617, + "mean_token_accuracy": 0.7238831579685211, + "num_tokens": 3953883.0, + "step": 1710 + }, + { + "epoch": 0.015769689190428166, + "learning_rate": 0.00019684789584670397, + "loss": 0.9744, + "mean_token_accuracy": 0.7155179023742676, + "num_tokens": 3976360.0, + "step": 1720 + }, + { + "epoch": 0.0158613734299074, + "learning_rate": 0.0001968295589988081, + "loss": 0.9624, + "mean_token_accuracy": 0.7200638294219971, + "num_tokens": 3998956.0, + "step": 1730 + }, + { + "epoch": 0.015953057669386633, + "learning_rate": 0.00019681122215091227, + "loss": 0.9652, + "mean_token_accuracy": 0.7259124040603637, + "num_tokens": 4022236.0, + "step": 1740 + }, + { + "epoch": 0.016044741908865866, + "learning_rate": 0.00019679288530301644, + "loss": 0.9405, + "mean_token_accuracy": 0.7326333880424499, + "num_tokens": 4044454.0, + "step": 1750 + }, + { + "epoch": 0.0161364261483451, + "learning_rate": 0.00019677454845512058, + "loss": 0.9286, + "mean_token_accuracy": 0.7249843358993531, + "num_tokens": 4068244.0, + "step": 1760 + }, + { + "epoch": 0.016228110387824332, + "learning_rate": 0.00019675621160722471, + "loss": 0.9753, + "mean_token_accuracy": 0.7207641959190368, + "num_tokens": 4091048.0, + "step": 1770 + }, + { + "epoch": 0.016319794627303565, + "learning_rate": 0.00019673787475932888, + "loss": 0.9255, + "mean_token_accuracy": 0.7323376059532165, + "num_tokens": 4113954.0, + "step": 1780 + }, + { + "epoch": 0.0164114788667828, + "learning_rate": 0.00019671953791143302, + "loss": 0.9517, + "mean_token_accuracy": 0.7274047136306763, + "num_tokens": 4136647.0, + "step": 1790 + }, + { + "epoch": 0.016503163106262035, + "learning_rate": 0.00019670120106353718, + "loss": 0.9591, + "mean_token_accuracy": 0.7191266596317292, + "num_tokens": 4159354.0, + "step": 1800 + }, + { + "epoch": 0.01659484734574127, + "learning_rate": 0.00019668286421564135, + "loss": 0.9155, + "mean_token_accuracy": 0.7271833419799805, + "num_tokens": 4182599.0, + "step": 1810 + }, + { + "epoch": 0.0166865315852205, + "learning_rate": 0.0001966645273677455, + "loss": 0.9437, + "mean_token_accuracy": 0.7300412118434906, + "num_tokens": 4205609.0, + "step": 1820 + }, + { + "epoch": 0.016778215824699735, + "learning_rate": 0.00019664619051984965, + "loss": 0.9627, + "mean_token_accuracy": 0.7181828320026398, + "num_tokens": 4228312.0, + "step": 1830 + }, + { + "epoch": 0.016869900064178968, + "learning_rate": 0.0001966278536719538, + "loss": 0.9653, + "mean_token_accuracy": 0.7201115906238555, + "num_tokens": 4252258.0, + "step": 1840 + }, + { + "epoch": 0.0169615843036582, + "learning_rate": 0.00019660951682405796, + "loss": 0.9111, + "mean_token_accuracy": 0.7319241642951966, + "num_tokens": 4274681.0, + "step": 1850 + }, + { + "epoch": 0.017053268543137434, + "learning_rate": 0.0001965911799761621, + "loss": 0.932, + "mean_token_accuracy": 0.7312391996383667, + "num_tokens": 4298157.0, + "step": 1860 + }, + { + "epoch": 0.017144952782616667, + "learning_rate": 0.00019657284312826626, + "loss": 0.9014, + "mean_token_accuracy": 0.734565258026123, + "num_tokens": 4321214.0, + "step": 1870 + }, + { + "epoch": 0.0172366370220959, + "learning_rate": 0.00019655450628037043, + "loss": 0.9306, + "mean_token_accuracy": 0.7280169785022735, + "num_tokens": 4345197.0, + "step": 1880 + }, + { + "epoch": 0.017328321261575134, + "learning_rate": 0.00019653616943247456, + "loss": 0.9564, + "mean_token_accuracy": 0.7204728484153747, + "num_tokens": 4368106.0, + "step": 1890 + }, + { + "epoch": 0.01742000550105437, + "learning_rate": 0.00019651783258457873, + "loss": 0.9601, + "mean_token_accuracy": 0.712797486782074, + "num_tokens": 4391291.0, + "step": 1900 + }, + { + "epoch": 0.017511689740533604, + "learning_rate": 0.00019649949573668287, + "loss": 0.9795, + "mean_token_accuracy": 0.7219728231430054, + "num_tokens": 4414395.0, + "step": 1910 + }, + { + "epoch": 0.017603373980012837, + "learning_rate": 0.00019648115888878703, + "loss": 0.9308, + "mean_token_accuracy": 0.7315888285636902, + "num_tokens": 4438227.0, + "step": 1920 + }, + { + "epoch": 0.01769505821949207, + "learning_rate": 0.00019646282204089117, + "loss": 0.9861, + "mean_token_accuracy": 0.7164831399917603, + "num_tokens": 4460466.0, + "step": 1930 + }, + { + "epoch": 0.017786742458971303, + "learning_rate": 0.00019644448519299534, + "loss": 0.9795, + "mean_token_accuracy": 0.7084175288677216, + "num_tokens": 4483128.0, + "step": 1940 + }, + { + "epoch": 0.017878426698450536, + "learning_rate": 0.0001964261483450995, + "loss": 0.9667, + "mean_token_accuracy": 0.7209431111812592, + "num_tokens": 4505460.0, + "step": 1950 + }, + { + "epoch": 0.01797011093792977, + "learning_rate": 0.00019640781149720364, + "loss": 0.9912, + "mean_token_accuracy": 0.7063813924789428, + "num_tokens": 4528513.0, + "step": 1960 + }, + { + "epoch": 0.018061795177409003, + "learning_rate": 0.00019638947464930778, + "loss": 0.9687, + "mean_token_accuracy": 0.7258190512657166, + "num_tokens": 4552384.0, + "step": 1970 + }, + { + "epoch": 0.018153479416888236, + "learning_rate": 0.00019637113780141194, + "loss": 0.9719, + "mean_token_accuracy": 0.7236562371253967, + "num_tokens": 4575577.0, + "step": 1980 + }, + { + "epoch": 0.01824516365636747, + "learning_rate": 0.00019635280095351608, + "loss": 0.9615, + "mean_token_accuracy": 0.7232940793037415, + "num_tokens": 4598952.0, + "step": 1990 + }, + { + "epoch": 0.018336847895846702, + "learning_rate": 0.00019633446410562028, + "loss": 0.9049, + "mean_token_accuracy": 0.7341329097747803, + "num_tokens": 4623559.0, + "step": 2000 + }, + { + "epoch": 0.01842853213532594, + "learning_rate": 0.00019631612725772441, + "loss": 0.9213, + "mean_token_accuracy": 0.7316263079643249, + "num_tokens": 4646930.0, + "step": 2010 + }, + { + "epoch": 0.018520216374805172, + "learning_rate": 0.00019629779040982855, + "loss": 0.9193, + "mean_token_accuracy": 0.7297214806079865, + "num_tokens": 4669607.0, + "step": 2020 + }, + { + "epoch": 0.018611900614284405, + "learning_rate": 0.00019627945356193272, + "loss": 0.9295, + "mean_token_accuracy": 0.7318191885948181, + "num_tokens": 4692450.0, + "step": 2030 + }, + { + "epoch": 0.01870358485376364, + "learning_rate": 0.00019626111671403686, + "loss": 0.9164, + "mean_token_accuracy": 0.7271653711795807, + "num_tokens": 4715980.0, + "step": 2040 + }, + { + "epoch": 0.01879526909324287, + "learning_rate": 0.00019624277986614102, + "loss": 0.9373, + "mean_token_accuracy": 0.7283840656280518, + "num_tokens": 4739203.0, + "step": 2050 + }, + { + "epoch": 0.018886953332722105, + "learning_rate": 0.00019622444301824516, + "loss": 0.9827, + "mean_token_accuracy": 0.7198963284492492, + "num_tokens": 4762605.0, + "step": 2060 + }, + { + "epoch": 0.018978637572201338, + "learning_rate": 0.00019620610617034933, + "loss": 0.9484, + "mean_token_accuracy": 0.7245118319988251, + "num_tokens": 4786308.0, + "step": 2070 + }, + { + "epoch": 0.01907032181168057, + "learning_rate": 0.0001961877693224535, + "loss": 0.9124, + "mean_token_accuracy": 0.7333156585693359, + "num_tokens": 4810147.0, + "step": 2080 + }, + { + "epoch": 0.019162006051159804, + "learning_rate": 0.00019616943247455763, + "loss": 0.9018, + "mean_token_accuracy": 0.7366366147994995, + "num_tokens": 4832350.0, + "step": 2090 + }, + { + "epoch": 0.019253690290639038, + "learning_rate": 0.0001961510956266618, + "loss": 0.9334, + "mean_token_accuracy": 0.7254868447780609, + "num_tokens": 4855821.0, + "step": 2100 + }, + { + "epoch": 0.019345374530118274, + "learning_rate": 0.00019613275877876593, + "loss": 0.9588, + "mean_token_accuracy": 0.7224485158920289, + "num_tokens": 4878509.0, + "step": 2110 + }, + { + "epoch": 0.019437058769597507, + "learning_rate": 0.0001961144219308701, + "loss": 0.927, + "mean_token_accuracy": 0.7318493902683259, + "num_tokens": 4902071.0, + "step": 2120 + }, + { + "epoch": 0.01952874300907674, + "learning_rate": 0.00019609608508297426, + "loss": 0.9281, + "mean_token_accuracy": 0.736470353603363, + "num_tokens": 4923762.0, + "step": 2130 + }, + { + "epoch": 0.019620427248555974, + "learning_rate": 0.0001960777482350784, + "loss": 0.93, + "mean_token_accuracy": 0.7328227162361145, + "num_tokens": 4946563.0, + "step": 2140 + }, + { + "epoch": 0.019712111488035207, + "learning_rate": 0.00019605941138718257, + "loss": 0.9769, + "mean_token_accuracy": 0.7141354322433472, + "num_tokens": 4969913.0, + "step": 2150 + }, + { + "epoch": 0.01980379572751444, + "learning_rate": 0.0001960410745392867, + "loss": 0.9012, + "mean_token_accuracy": 0.7336618602275848, + "num_tokens": 4993848.0, + "step": 2160 + }, + { + "epoch": 0.019895479966993673, + "learning_rate": 0.00019602273769139084, + "loss": 0.9385, + "mean_token_accuracy": 0.7301294863224029, + "num_tokens": 5016536.0, + "step": 2170 + }, + { + "epoch": 0.019987164206472906, + "learning_rate": 0.000196004400843495, + "loss": 0.9444, + "mean_token_accuracy": 0.720094096660614, + "num_tokens": 5039552.0, + "step": 2180 + }, + { + "epoch": 0.02007884844595214, + "learning_rate": 0.00019598606399559915, + "loss": 0.9669, + "mean_token_accuracy": 0.720612359046936, + "num_tokens": 5062464.0, + "step": 2190 + }, + { + "epoch": 0.020170532685431373, + "learning_rate": 0.00019596772714770334, + "loss": 0.9375, + "mean_token_accuracy": 0.7292058229446411, + "num_tokens": 5084932.0, + "step": 2200 + }, + { + "epoch": 0.02026221692491061, + "learning_rate": 0.00019594939029980748, + "loss": 0.8964, + "mean_token_accuracy": 0.7395495593547821, + "num_tokens": 5108191.0, + "step": 2210 + }, + { + "epoch": 0.020353901164389843, + "learning_rate": 0.00019593105345191162, + "loss": 0.9611, + "mean_token_accuracy": 0.7236228704452514, + "num_tokens": 5131864.0, + "step": 2220 + }, + { + "epoch": 0.020445585403869076, + "learning_rate": 0.00019591271660401578, + "loss": 1.0113, + "mean_token_accuracy": 0.714591783285141, + "num_tokens": 5154579.0, + "step": 2230 + }, + { + "epoch": 0.02053726964334831, + "learning_rate": 0.00019589437975611992, + "loss": 0.949, + "mean_token_accuracy": 0.7267784833908081, + "num_tokens": 5177731.0, + "step": 2240 + }, + { + "epoch": 0.020628953882827542, + "learning_rate": 0.00019587604290822409, + "loss": 0.9255, + "mean_token_accuracy": 0.7317762017250061, + "num_tokens": 5201252.0, + "step": 2250 + }, + { + "epoch": 0.020720638122306775, + "learning_rate": 0.00019585770606032825, + "loss": 0.9554, + "mean_token_accuracy": 0.7194037437438965, + "num_tokens": 5224340.0, + "step": 2260 + }, + { + "epoch": 0.02081232236178601, + "learning_rate": 0.0001958393692124324, + "loss": 0.9506, + "mean_token_accuracy": 0.7309067130088807, + "num_tokens": 5247853.0, + "step": 2270 + }, + { + "epoch": 0.020904006601265242, + "learning_rate": 0.00019582103236453655, + "loss": 0.968, + "mean_token_accuracy": 0.7199053347110749, + "num_tokens": 5270539.0, + "step": 2280 + }, + { + "epoch": 0.020995690840744475, + "learning_rate": 0.0001958026955166407, + "loss": 0.9228, + "mean_token_accuracy": 0.7256809651851654, + "num_tokens": 5293157.0, + "step": 2290 + }, + { + "epoch": 0.021087375080223708, + "learning_rate": 0.00019578435866874486, + "loss": 0.9045, + "mean_token_accuracy": 0.7299234926700592, + "num_tokens": 5316419.0, + "step": 2300 + }, + { + "epoch": 0.021179059319702945, + "learning_rate": 0.000195766021820849, + "loss": 0.9354, + "mean_token_accuracy": 0.7320650398731232, + "num_tokens": 5340590.0, + "step": 2310 + }, + { + "epoch": 0.021270743559182178, + "learning_rate": 0.00019574768497295316, + "loss": 0.9831, + "mean_token_accuracy": 0.7165019750595093, + "num_tokens": 5363922.0, + "step": 2320 + }, + { + "epoch": 0.02136242779866141, + "learning_rate": 0.00019572934812505733, + "loss": 0.9671, + "mean_token_accuracy": 0.717933064699173, + "num_tokens": 5387419.0, + "step": 2330 + }, + { + "epoch": 0.021454112038140644, + "learning_rate": 0.00019571101127716147, + "loss": 0.9082, + "mean_token_accuracy": 0.7313336968421936, + "num_tokens": 5410015.0, + "step": 2340 + }, + { + "epoch": 0.021545796277619877, + "learning_rate": 0.00019569267442926563, + "loss": 0.9328, + "mean_token_accuracy": 0.7289097845554352, + "num_tokens": 5432736.0, + "step": 2350 + }, + { + "epoch": 0.02163748051709911, + "learning_rate": 0.00019567433758136977, + "loss": 0.9688, + "mean_token_accuracy": 0.7147701561450959, + "num_tokens": 5455943.0, + "step": 2360 + }, + { + "epoch": 0.021729164756578344, + "learning_rate": 0.0001956560007334739, + "loss": 0.9308, + "mean_token_accuracy": 0.7298171997070313, + "num_tokens": 5478813.0, + "step": 2370 + }, + { + "epoch": 0.021820848996057577, + "learning_rate": 0.00019563766388557807, + "loss": 0.9489, + "mean_token_accuracy": 0.7274266302585601, + "num_tokens": 5502569.0, + "step": 2380 + }, + { + "epoch": 0.02191253323553681, + "learning_rate": 0.00019561932703768224, + "loss": 0.9286, + "mean_token_accuracy": 0.7251901865005493, + "num_tokens": 5525763.0, + "step": 2390 + }, + { + "epoch": 0.022004217475016043, + "learning_rate": 0.0001956009901897864, + "loss": 0.9473, + "mean_token_accuracy": 0.727522361278534, + "num_tokens": 5548671.0, + "step": 2400 + }, + { + "epoch": 0.022095901714495277, + "learning_rate": 0.00019558265334189054, + "loss": 0.9852, + "mean_token_accuracy": 0.7218357384204864, + "num_tokens": 5571555.0, + "step": 2410 + }, + { + "epoch": 0.022187585953974513, + "learning_rate": 0.00019556431649399468, + "loss": 0.9594, + "mean_token_accuracy": 0.7173354685306549, + "num_tokens": 5594684.0, + "step": 2420 + }, + { + "epoch": 0.022279270193453746, + "learning_rate": 0.00019554597964609885, + "loss": 0.9623, + "mean_token_accuracy": 0.7192810893058776, + "num_tokens": 5617557.0, + "step": 2430 + }, + { + "epoch": 0.02237095443293298, + "learning_rate": 0.00019552764279820298, + "loss": 0.9095, + "mean_token_accuracy": 0.7417798578739166, + "num_tokens": 5640621.0, + "step": 2440 + }, + { + "epoch": 0.022462638672412213, + "learning_rate": 0.00019550930595030715, + "loss": 0.9789, + "mean_token_accuracy": 0.718708848953247, + "num_tokens": 5663739.0, + "step": 2450 + }, + { + "epoch": 0.022554322911891446, + "learning_rate": 0.00019549096910241132, + "loss": 0.969, + "mean_token_accuracy": 0.7202953457832336, + "num_tokens": 5686800.0, + "step": 2460 + }, + { + "epoch": 0.02264600715137068, + "learning_rate": 0.00019547263225451545, + "loss": 0.9173, + "mean_token_accuracy": 0.7371094405651093, + "num_tokens": 5710180.0, + "step": 2470 + }, + { + "epoch": 0.022737691390849912, + "learning_rate": 0.00019545429540661962, + "loss": 0.9098, + "mean_token_accuracy": 0.7396210551261901, + "num_tokens": 5733142.0, + "step": 2480 + }, + { + "epoch": 0.022829375630329145, + "learning_rate": 0.00019543595855872376, + "loss": 0.9503, + "mean_token_accuracy": 0.723417603969574, + "num_tokens": 5755600.0, + "step": 2490 + }, + { + "epoch": 0.02292105986980838, + "learning_rate": 0.00019541762171082792, + "loss": 0.945, + "mean_token_accuracy": 0.7276733875274658, + "num_tokens": 5778864.0, + "step": 2500 + }, + { + "epoch": 0.023012744109287612, + "learning_rate": 0.00019539928486293206, + "loss": 0.942, + "mean_token_accuracy": 0.7287339627742767, + "num_tokens": 5801942.0, + "step": 2510 + }, + { + "epoch": 0.02310442834876685, + "learning_rate": 0.00019538094801503623, + "loss": 0.9009, + "mean_token_accuracy": 0.7320193171501159, + "num_tokens": 5825136.0, + "step": 2520 + }, + { + "epoch": 0.02319611258824608, + "learning_rate": 0.0001953626111671404, + "loss": 0.9748, + "mean_token_accuracy": 0.719618844985962, + "num_tokens": 5848051.0, + "step": 2530 + }, + { + "epoch": 0.023287796827725315, + "learning_rate": 0.00019534427431924453, + "loss": 0.934, + "mean_token_accuracy": 0.7233562409877777, + "num_tokens": 5872042.0, + "step": 2540 + }, + { + "epoch": 0.023379481067204548, + "learning_rate": 0.0001953259374713487, + "loss": 0.9327, + "mean_token_accuracy": 0.7312821507453918, + "num_tokens": 5894234.0, + "step": 2550 + }, + { + "epoch": 0.02347116530668378, + "learning_rate": 0.00019530760062345283, + "loss": 0.9526, + "mean_token_accuracy": 0.7317610204219818, + "num_tokens": 5917184.0, + "step": 2560 + }, + { + "epoch": 0.023562849546163014, + "learning_rate": 0.00019528926377555697, + "loss": 0.9128, + "mean_token_accuracy": 0.7336754083633423, + "num_tokens": 5941067.0, + "step": 2570 + }, + { + "epoch": 0.023654533785642248, + "learning_rate": 0.00019527092692766114, + "loss": 0.8943, + "mean_token_accuracy": 0.7358475089073181, + "num_tokens": 5963855.0, + "step": 2580 + }, + { + "epoch": 0.02374621802512148, + "learning_rate": 0.0001952525900797653, + "loss": 0.9766, + "mean_token_accuracy": 0.7097460091114044, + "num_tokens": 5987158.0, + "step": 2590 + }, + { + "epoch": 0.023837902264600714, + "learning_rate": 0.00019523425323186947, + "loss": 0.9264, + "mean_token_accuracy": 0.729276442527771, + "num_tokens": 6010071.0, + "step": 2600 + }, + { + "epoch": 0.023929586504079947, + "learning_rate": 0.0001952159163839736, + "loss": 0.9145, + "mean_token_accuracy": 0.7364008963108063, + "num_tokens": 6032716.0, + "step": 2610 + }, + { + "epoch": 0.024021270743559184, + "learning_rate": 0.00019519757953607775, + "loss": 0.9328, + "mean_token_accuracy": 0.732559758424759, + "num_tokens": 6055494.0, + "step": 2620 + }, + { + "epoch": 0.024112954983038417, + "learning_rate": 0.0001951792426881819, + "loss": 0.9641, + "mean_token_accuracy": 0.7260844290256501, + "num_tokens": 6078113.0, + "step": 2630 + }, + { + "epoch": 0.02420463922251765, + "learning_rate": 0.00019516090584028605, + "loss": 0.9092, + "mean_token_accuracy": 0.7366998136043549, + "num_tokens": 6101402.0, + "step": 2640 + }, + { + "epoch": 0.024296323461996883, + "learning_rate": 0.00019514256899239021, + "loss": 0.9108, + "mean_token_accuracy": 0.7387801766395569, + "num_tokens": 6124010.0, + "step": 2650 + }, + { + "epoch": 0.024388007701476117, + "learning_rate": 0.00019512423214449438, + "loss": 0.8658, + "mean_token_accuracy": 0.740670245885849, + "num_tokens": 6146406.0, + "step": 2660 + }, + { + "epoch": 0.02447969194095535, + "learning_rate": 0.00019510589529659852, + "loss": 0.9599, + "mean_token_accuracy": 0.725754851102829, + "num_tokens": 6170514.0, + "step": 2670 + }, + { + "epoch": 0.024571376180434583, + "learning_rate": 0.00019508755844870268, + "loss": 0.9334, + "mean_token_accuracy": 0.7298601746559144, + "num_tokens": 6193378.0, + "step": 2680 + }, + { + "epoch": 0.024663060419913816, + "learning_rate": 0.00019506922160080682, + "loss": 0.9265, + "mean_token_accuracy": 0.7361769676208496, + "num_tokens": 6215842.0, + "step": 2690 + }, + { + "epoch": 0.02475474465939305, + "learning_rate": 0.000195050884752911, + "loss": 0.8876, + "mean_token_accuracy": 0.7371805787086487, + "num_tokens": 6238984.0, + "step": 2700 + }, + { + "epoch": 0.024846428898872282, + "learning_rate": 0.00019503254790501513, + "loss": 0.9446, + "mean_token_accuracy": 0.7247693419456482, + "num_tokens": 6262221.0, + "step": 2710 + }, + { + "epoch": 0.02493811313835152, + "learning_rate": 0.0001950142110571193, + "loss": 0.9376, + "mean_token_accuracy": 0.7261334121227264, + "num_tokens": 6285174.0, + "step": 2720 + }, + { + "epoch": 0.025029797377830752, + "learning_rate": 0.00019499587420922346, + "loss": 0.9415, + "mean_token_accuracy": 0.7219414234161377, + "num_tokens": 6307994.0, + "step": 2730 + }, + { + "epoch": 0.025121481617309985, + "learning_rate": 0.0001949775373613276, + "loss": 0.9269, + "mean_token_accuracy": 0.7352584719657898, + "num_tokens": 6331386.0, + "step": 2740 + }, + { + "epoch": 0.02521316585678922, + "learning_rate": 0.00019495920051343176, + "loss": 0.9408, + "mean_token_accuracy": 0.7218868672847748, + "num_tokens": 6354377.0, + "step": 2750 + }, + { + "epoch": 0.025304850096268452, + "learning_rate": 0.0001949408636655359, + "loss": 0.9418, + "mean_token_accuracy": 0.7339106857776642, + "num_tokens": 6377356.0, + "step": 2760 + }, + { + "epoch": 0.025396534335747685, + "learning_rate": 0.00019492252681764004, + "loss": 0.9771, + "mean_token_accuracy": 0.7172683537006378, + "num_tokens": 6400570.0, + "step": 2770 + }, + { + "epoch": 0.025488218575226918, + "learning_rate": 0.0001949041899697442, + "loss": 0.913, + "mean_token_accuracy": 0.7312417685985565, + "num_tokens": 6423983.0, + "step": 2780 + }, + { + "epoch": 0.02557990281470615, + "learning_rate": 0.00019488585312184837, + "loss": 0.9636, + "mean_token_accuracy": 0.7262275397777558, + "num_tokens": 6446226.0, + "step": 2790 + }, + { + "epoch": 0.025671587054185385, + "learning_rate": 0.00019486751627395253, + "loss": 0.9491, + "mean_token_accuracy": 0.7296705484390259, + "num_tokens": 6468335.0, + "step": 2800 + }, + { + "epoch": 0.025763271293664618, + "learning_rate": 0.00019484917942605667, + "loss": 0.9014, + "mean_token_accuracy": 0.7369650721549987, + "num_tokens": 6491446.0, + "step": 2810 + }, + { + "epoch": 0.02585495553314385, + "learning_rate": 0.0001948308425781608, + "loss": 0.9175, + "mean_token_accuracy": 0.7304332315921783, + "num_tokens": 6514073.0, + "step": 2820 + }, + { + "epoch": 0.025946639772623088, + "learning_rate": 0.00019481250573026498, + "loss": 0.9796, + "mean_token_accuracy": 0.719984632730484, + "num_tokens": 6535888.0, + "step": 2830 + }, + { + "epoch": 0.02603832401210232, + "learning_rate": 0.00019479416888236911, + "loss": 0.916, + "mean_token_accuracy": 0.729135948419571, + "num_tokens": 6559120.0, + "step": 2840 + }, + { + "epoch": 0.026130008251581554, + "learning_rate": 0.0001947758320344733, + "loss": 0.9709, + "mean_token_accuracy": 0.7150510847568512, + "num_tokens": 6582047.0, + "step": 2850 + }, + { + "epoch": 0.026221692491060787, + "learning_rate": 0.00019475749518657744, + "loss": 0.9787, + "mean_token_accuracy": 0.7159995019435883, + "num_tokens": 6605452.0, + "step": 2860 + }, + { + "epoch": 0.02631337673054002, + "learning_rate": 0.00019473915833868158, + "loss": 0.8902, + "mean_token_accuracy": 0.7358322203159332, + "num_tokens": 6628820.0, + "step": 2870 + }, + { + "epoch": 0.026405060970019253, + "learning_rate": 0.00019472082149078575, + "loss": 0.9268, + "mean_token_accuracy": 0.7268377065658569, + "num_tokens": 6651668.0, + "step": 2880 + }, + { + "epoch": 0.026496745209498487, + "learning_rate": 0.0001947024846428899, + "loss": 0.8938, + "mean_token_accuracy": 0.739132821559906, + "num_tokens": 6674632.0, + "step": 2890 + }, + { + "epoch": 0.02658842944897772, + "learning_rate": 0.00019468414779499405, + "loss": 0.9266, + "mean_token_accuracy": 0.7303313732147216, + "num_tokens": 6698564.0, + "step": 2900 + }, + { + "epoch": 0.026680113688456953, + "learning_rate": 0.0001946658109470982, + "loss": 0.9477, + "mean_token_accuracy": 0.7183525085449218, + "num_tokens": 6721992.0, + "step": 2910 + }, + { + "epoch": 0.026771797927936186, + "learning_rate": 0.00019464747409920236, + "loss": 0.9278, + "mean_token_accuracy": 0.7257976174354553, + "num_tokens": 6745472.0, + "step": 2920 + }, + { + "epoch": 0.026863482167415423, + "learning_rate": 0.00019462913725130652, + "loss": 0.9158, + "mean_token_accuracy": 0.7347129762172699, + "num_tokens": 6769153.0, + "step": 2930 + }, + { + "epoch": 0.026955166406894656, + "learning_rate": 0.00019461080040341066, + "loss": 0.9305, + "mean_token_accuracy": 0.728382408618927, + "num_tokens": 6792791.0, + "step": 2940 + }, + { + "epoch": 0.02704685064637389, + "learning_rate": 0.00019459246355551482, + "loss": 0.9253, + "mean_token_accuracy": 0.7284856557846069, + "num_tokens": 6816008.0, + "step": 2950 + }, + { + "epoch": 0.027138534885853122, + "learning_rate": 0.00019457412670761896, + "loss": 0.942, + "mean_token_accuracy": 0.7243313372135163, + "num_tokens": 6839554.0, + "step": 2960 + }, + { + "epoch": 0.027230219125332356, + "learning_rate": 0.0001945557898597231, + "loss": 0.9324, + "mean_token_accuracy": 0.7303346991539001, + "num_tokens": 6862086.0, + "step": 2970 + }, + { + "epoch": 0.02732190336481159, + "learning_rate": 0.0001945374530118273, + "loss": 0.9493, + "mean_token_accuracy": 0.7256803274154663, + "num_tokens": 6884659.0, + "step": 2980 + }, + { + "epoch": 0.027413587604290822, + "learning_rate": 0.00019451911616393143, + "loss": 0.9152, + "mean_token_accuracy": 0.7365429759025574, + "num_tokens": 6908688.0, + "step": 2990 + }, + { + "epoch": 0.027505271843770055, + "learning_rate": 0.0001945007793160356, + "loss": 0.9504, + "mean_token_accuracy": 0.7272844731807708, + "num_tokens": 6931862.0, + "step": 3000 + }, + { + "epoch": 0.02759695608324929, + "learning_rate": 0.00019448244246813974, + "loss": 0.9153, + "mean_token_accuracy": 0.7273892223834991, + "num_tokens": 6955720.0, + "step": 3010 + }, + { + "epoch": 0.02768864032272852, + "learning_rate": 0.00019446410562024387, + "loss": 0.9306, + "mean_token_accuracy": 0.7319213390350342, + "num_tokens": 6978669.0, + "step": 3020 + }, + { + "epoch": 0.027780324562207758, + "learning_rate": 0.00019444576877234804, + "loss": 0.8965, + "mean_token_accuracy": 0.732559609413147, + "num_tokens": 7001564.0, + "step": 3030 + }, + { + "epoch": 0.02787200880168699, + "learning_rate": 0.00019442743192445218, + "loss": 0.9654, + "mean_token_accuracy": 0.7271079003810883, + "num_tokens": 7025252.0, + "step": 3040 + }, + { + "epoch": 0.027963693041166224, + "learning_rate": 0.00019440909507655637, + "loss": 0.9704, + "mean_token_accuracy": 0.7184332847595215, + "num_tokens": 7048790.0, + "step": 3050 + }, + { + "epoch": 0.028055377280645458, + "learning_rate": 0.0001943907582286605, + "loss": 0.9123, + "mean_token_accuracy": 0.7326594293117523, + "num_tokens": 7072185.0, + "step": 3060 + }, + { + "epoch": 0.02814706152012469, + "learning_rate": 0.00019437242138076465, + "loss": 0.9122, + "mean_token_accuracy": 0.7348964989185334, + "num_tokens": 7095313.0, + "step": 3070 + }, + { + "epoch": 0.028238745759603924, + "learning_rate": 0.0001943540845328688, + "loss": 0.9319, + "mean_token_accuracy": 0.7342008352279663, + "num_tokens": 7118411.0, + "step": 3080 + }, + { + "epoch": 0.028330429999083157, + "learning_rate": 0.00019433574768497295, + "loss": 0.9054, + "mean_token_accuracy": 0.7365982592105865, + "num_tokens": 7140666.0, + "step": 3090 + }, + { + "epoch": 0.02842211423856239, + "learning_rate": 0.00019431741083707712, + "loss": 0.9356, + "mean_token_accuracy": 0.7332864880561829, + "num_tokens": 7164803.0, + "step": 3100 + }, + { + "epoch": 0.028513798478041624, + "learning_rate": 0.00019429907398918128, + "loss": 0.9217, + "mean_token_accuracy": 0.7311400473117828, + "num_tokens": 7188525.0, + "step": 3110 + }, + { + "epoch": 0.028605482717520857, + "learning_rate": 0.00019428073714128542, + "loss": 0.9382, + "mean_token_accuracy": 0.7273888885974884, + "num_tokens": 7212173.0, + "step": 3120 + }, + { + "epoch": 0.028697166957000093, + "learning_rate": 0.00019426240029338959, + "loss": 0.8698, + "mean_token_accuracy": 0.7442355751991272, + "num_tokens": 7235299.0, + "step": 3130 + }, + { + "epoch": 0.028788851196479327, + "learning_rate": 0.00019424406344549372, + "loss": 0.9424, + "mean_token_accuracy": 0.7223499357700348, + "num_tokens": 7258654.0, + "step": 3140 + }, + { + "epoch": 0.02888053543595856, + "learning_rate": 0.0001942257265975979, + "loss": 0.9632, + "mean_token_accuracy": 0.7214014410972596, + "num_tokens": 7282501.0, + "step": 3150 + }, + { + "epoch": 0.028972219675437793, + "learning_rate": 0.00019420738974970203, + "loss": 0.965, + "mean_token_accuracy": 0.7162065744400025, + "num_tokens": 7304978.0, + "step": 3160 + }, + { + "epoch": 0.029063903914917026, + "learning_rate": 0.00019418905290180617, + "loss": 0.932, + "mean_token_accuracy": 0.7355128765106201, + "num_tokens": 7327854.0, + "step": 3170 + }, + { + "epoch": 0.02915558815439626, + "learning_rate": 0.00019417071605391036, + "loss": 0.9462, + "mean_token_accuracy": 0.7246469616889953, + "num_tokens": 7350491.0, + "step": 3180 + }, + { + "epoch": 0.029247272393875492, + "learning_rate": 0.0001941523792060145, + "loss": 0.954, + "mean_token_accuracy": 0.7225529968738555, + "num_tokens": 7374164.0, + "step": 3190 + }, + { + "epoch": 0.029338956633354726, + "learning_rate": 0.00019413404235811866, + "loss": 0.9212, + "mean_token_accuracy": 0.7264076113700867, + "num_tokens": 7396796.0, + "step": 3200 + }, + { + "epoch": 0.02943064087283396, + "learning_rate": 0.0001941157055102228, + "loss": 0.9442, + "mean_token_accuracy": 0.721256959438324, + "num_tokens": 7420750.0, + "step": 3210 + }, + { + "epoch": 0.029522325112313192, + "learning_rate": 0.00019409736866232694, + "loss": 0.9102, + "mean_token_accuracy": 0.7344326734542846, + "num_tokens": 7443504.0, + "step": 3220 + }, + { + "epoch": 0.029614009351792425, + "learning_rate": 0.0001940790318144311, + "loss": 0.9198, + "mean_token_accuracy": 0.7297407686710358, + "num_tokens": 7466958.0, + "step": 3230 + }, + { + "epoch": 0.029705693591271662, + "learning_rate": 0.00019406069496653527, + "loss": 0.921, + "mean_token_accuracy": 0.7294909179210662, + "num_tokens": 7490438.0, + "step": 3240 + }, + { + "epoch": 0.029797377830750895, + "learning_rate": 0.00019404235811863944, + "loss": 0.9084, + "mean_token_accuracy": 0.7329320967197418, + "num_tokens": 7512827.0, + "step": 3250 + }, + { + "epoch": 0.029889062070230128, + "learning_rate": 0.00019402402127074357, + "loss": 0.9329, + "mean_token_accuracy": 0.7312842011451721, + "num_tokens": 7536334.0, + "step": 3260 + }, + { + "epoch": 0.02998074630970936, + "learning_rate": 0.0001940056844228477, + "loss": 0.9365, + "mean_token_accuracy": 0.7257433235645294, + "num_tokens": 7559931.0, + "step": 3270 + }, + { + "epoch": 0.030072430549188595, + "learning_rate": 0.00019398734757495188, + "loss": 1.0004, + "mean_token_accuracy": 0.7128322720527649, + "num_tokens": 7584030.0, + "step": 3280 + }, + { + "epoch": 0.030164114788667828, + "learning_rate": 0.00019396901072705602, + "loss": 0.9296, + "mean_token_accuracy": 0.7273230791091919, + "num_tokens": 7606954.0, + "step": 3290 + }, + { + "epoch": 0.03025579902814706, + "learning_rate": 0.00019395067387916018, + "loss": 0.9096, + "mean_token_accuracy": 0.7309522807598114, + "num_tokens": 7630471.0, + "step": 3300 + }, + { + "epoch": 0.030347483267626294, + "learning_rate": 0.00019393233703126435, + "loss": 0.9365, + "mean_token_accuracy": 0.7274603307247162, + "num_tokens": 7654156.0, + "step": 3310 + }, + { + "epoch": 0.030439167507105527, + "learning_rate": 0.00019391400018336848, + "loss": 0.9204, + "mean_token_accuracy": 0.7304625988006592, + "num_tokens": 7676993.0, + "step": 3320 + }, + { + "epoch": 0.03053085174658476, + "learning_rate": 0.00019389566333547265, + "loss": 0.8979, + "mean_token_accuracy": 0.7398621261119842, + "num_tokens": 7700705.0, + "step": 3330 + }, + { + "epoch": 0.030622535986063997, + "learning_rate": 0.0001938773264875768, + "loss": 0.9062, + "mean_token_accuracy": 0.7303354918956757, + "num_tokens": 7723897.0, + "step": 3340 + }, + { + "epoch": 0.03071422022554323, + "learning_rate": 0.00019385898963968095, + "loss": 0.9335, + "mean_token_accuracy": 0.7265379667282105, + "num_tokens": 7747534.0, + "step": 3350 + }, + { + "epoch": 0.030805904465022464, + "learning_rate": 0.0001938406527917851, + "loss": 0.9404, + "mean_token_accuracy": 0.7280780255794526, + "num_tokens": 7770833.0, + "step": 3360 + }, + { + "epoch": 0.030897588704501697, + "learning_rate": 0.00019382231594388926, + "loss": 0.9224, + "mean_token_accuracy": 0.7308550953865052, + "num_tokens": 7794236.0, + "step": 3370 + }, + { + "epoch": 0.03098927294398093, + "learning_rate": 0.00019380397909599342, + "loss": 0.8752, + "mean_token_accuracy": 0.7406655371189117, + "num_tokens": 7817781.0, + "step": 3380 + }, + { + "epoch": 0.031080957183460163, + "learning_rate": 0.00019378564224809756, + "loss": 0.9681, + "mean_token_accuracy": 0.7218480706214905, + "num_tokens": 7840338.0, + "step": 3390 + }, + { + "epoch": 0.031172641422939396, + "learning_rate": 0.00019376730540020173, + "loss": 0.9164, + "mean_token_accuracy": 0.7277542173862457, + "num_tokens": 7862721.0, + "step": 3400 + }, + { + "epoch": 0.03126432566241863, + "learning_rate": 0.00019374896855230587, + "loss": 0.9116, + "mean_token_accuracy": 0.7325112044811248, + "num_tokens": 7885451.0, + "step": 3410 + }, + { + "epoch": 0.031356009901897866, + "learning_rate": 0.00019373063170441, + "loss": 0.9064, + "mean_token_accuracy": 0.7332186162471771, + "num_tokens": 7907812.0, + "step": 3420 + }, + { + "epoch": 0.031447694141377096, + "learning_rate": 0.00019371229485651417, + "loss": 0.9386, + "mean_token_accuracy": 0.7319149374961853, + "num_tokens": 7931090.0, + "step": 3430 + }, + { + "epoch": 0.03153937838085633, + "learning_rate": 0.00019369395800861833, + "loss": 0.962, + "mean_token_accuracy": 0.7256182253360748, + "num_tokens": 7953775.0, + "step": 3440 + }, + { + "epoch": 0.03163106262033556, + "learning_rate": 0.0001936756211607225, + "loss": 0.8555, + "mean_token_accuracy": 0.747320145368576, + "num_tokens": 7976398.0, + "step": 3450 + }, + { + "epoch": 0.0317227468598148, + "learning_rate": 0.00019365728431282664, + "loss": 0.9331, + "mean_token_accuracy": 0.7238705515861511, + "num_tokens": 8000784.0, + "step": 3460 + }, + { + "epoch": 0.03181443109929403, + "learning_rate": 0.00019363894746493078, + "loss": 0.9115, + "mean_token_accuracy": 0.7366018474102021, + "num_tokens": 8023750.0, + "step": 3470 + }, + { + "epoch": 0.031906115338773265, + "learning_rate": 0.00019362061061703494, + "loss": 0.9215, + "mean_token_accuracy": 0.7342450380325317, + "num_tokens": 8047137.0, + "step": 3480 + }, + { + "epoch": 0.0319977995782525, + "learning_rate": 0.00019360227376913908, + "loss": 0.9106, + "mean_token_accuracy": 0.728040623664856, + "num_tokens": 8069307.0, + "step": 3490 + }, + { + "epoch": 0.03208948381773173, + "learning_rate": 0.00019358393692124325, + "loss": 0.9269, + "mean_token_accuracy": 0.7291705071926117, + "num_tokens": 8092285.0, + "step": 3500 + }, + { + "epoch": 0.03218116805721097, + "learning_rate": 0.0001935656000733474, + "loss": 0.9263, + "mean_token_accuracy": 0.73028724193573, + "num_tokens": 8115420.0, + "step": 3510 + }, + { + "epoch": 0.0322728522966902, + "learning_rate": 0.00019354726322545155, + "loss": 0.9064, + "mean_token_accuracy": 0.7332595527172089, + "num_tokens": 8137777.0, + "step": 3520 + }, + { + "epoch": 0.032364536536169435, + "learning_rate": 0.00019352892637755571, + "loss": 0.8974, + "mean_token_accuracy": 0.7386172652244568, + "num_tokens": 8161065.0, + "step": 3530 + }, + { + "epoch": 0.032456220775648664, + "learning_rate": 0.00019351058952965985, + "loss": 0.8913, + "mean_token_accuracy": 0.7372443437576294, + "num_tokens": 8184175.0, + "step": 3540 + }, + { + "epoch": 0.0325479050151279, + "learning_rate": 0.00019349225268176402, + "loss": 0.9465, + "mean_token_accuracy": 0.7191249907016755, + "num_tokens": 8206748.0, + "step": 3550 + }, + { + "epoch": 0.03263958925460713, + "learning_rate": 0.00019347391583386816, + "loss": 0.9263, + "mean_token_accuracy": 0.7323255717754364, + "num_tokens": 8230621.0, + "step": 3560 + }, + { + "epoch": 0.03273127349408637, + "learning_rate": 0.00019345557898597232, + "loss": 0.9426, + "mean_token_accuracy": 0.7250443637371063, + "num_tokens": 8254704.0, + "step": 3570 + }, + { + "epoch": 0.0328229577335656, + "learning_rate": 0.0001934372421380765, + "loss": 0.8757, + "mean_token_accuracy": 0.7412980794906616, + "num_tokens": 8278789.0, + "step": 3580 + }, + { + "epoch": 0.032914641973044834, + "learning_rate": 0.00019341890529018063, + "loss": 0.9462, + "mean_token_accuracy": 0.7306847631931305, + "num_tokens": 8302665.0, + "step": 3590 + }, + { + "epoch": 0.03300632621252407, + "learning_rate": 0.0001934005684422848, + "loss": 0.9305, + "mean_token_accuracy": 0.7272827684879303, + "num_tokens": 8326571.0, + "step": 3600 + }, + { + "epoch": 0.0330980104520033, + "learning_rate": 0.00019338223159438893, + "loss": 0.9385, + "mean_token_accuracy": 0.728124612569809, + "num_tokens": 8349752.0, + "step": 3610 + }, + { + "epoch": 0.03318969469148254, + "learning_rate": 0.00019336389474649307, + "loss": 0.9288, + "mean_token_accuracy": 0.7261069536209106, + "num_tokens": 8373054.0, + "step": 3620 + }, + { + "epoch": 0.033281378930961766, + "learning_rate": 0.00019334555789859723, + "loss": 0.9452, + "mean_token_accuracy": 0.726563709974289, + "num_tokens": 8396409.0, + "step": 3630 + }, + { + "epoch": 0.033373063170441, + "learning_rate": 0.0001933272210507014, + "loss": 0.9343, + "mean_token_accuracy": 0.7256794333457947, + "num_tokens": 8419902.0, + "step": 3640 + }, + { + "epoch": 0.03346474740992023, + "learning_rate": 0.00019330888420280556, + "loss": 0.892, + "mean_token_accuracy": 0.7357638061046601, + "num_tokens": 8442209.0, + "step": 3650 + }, + { + "epoch": 0.03355643164939947, + "learning_rate": 0.0001932905473549097, + "loss": 0.9634, + "mean_token_accuracy": 0.7277958691120148, + "num_tokens": 8465645.0, + "step": 3660 + }, + { + "epoch": 0.0336481158888787, + "learning_rate": 0.00019327221050701384, + "loss": 0.9424, + "mean_token_accuracy": 0.7206253051757813, + "num_tokens": 8488580.0, + "step": 3670 + }, + { + "epoch": 0.033739800128357936, + "learning_rate": 0.000193253873659118, + "loss": 0.9341, + "mean_token_accuracy": 0.7325787842273712, + "num_tokens": 8512041.0, + "step": 3680 + }, + { + "epoch": 0.033831484367837165, + "learning_rate": 0.00019323553681122214, + "loss": 0.964, + "mean_token_accuracy": 0.7234341681003571, + "num_tokens": 8535048.0, + "step": 3690 + }, + { + "epoch": 0.0339231686073164, + "learning_rate": 0.0001932171999633263, + "loss": 0.9443, + "mean_token_accuracy": 0.7267716944217681, + "num_tokens": 8558636.0, + "step": 3700 + }, + { + "epoch": 0.03401485284679564, + "learning_rate": 0.00019319886311543048, + "loss": 0.9254, + "mean_token_accuracy": 0.7347033023834229, + "num_tokens": 8581147.0, + "step": 3710 + }, + { + "epoch": 0.03410653708627487, + "learning_rate": 0.00019318052626753461, + "loss": 0.8836, + "mean_token_accuracy": 0.7345532178878784, + "num_tokens": 8604458.0, + "step": 3720 + }, + { + "epoch": 0.034198221325754105, + "learning_rate": 0.00019316218941963878, + "loss": 0.8826, + "mean_token_accuracy": 0.7402276337146759, + "num_tokens": 8628067.0, + "step": 3730 + }, + { + "epoch": 0.034289905565233335, + "learning_rate": 0.00019314385257174292, + "loss": 0.9612, + "mean_token_accuracy": 0.7229425013065338, + "num_tokens": 8651721.0, + "step": 3740 + }, + { + "epoch": 0.03438158980471257, + "learning_rate": 0.00019312551572384708, + "loss": 0.9006, + "mean_token_accuracy": 0.7286960244178772, + "num_tokens": 8674637.0, + "step": 3750 + }, + { + "epoch": 0.0344732740441918, + "learning_rate": 0.00019310717887595122, + "loss": 0.9431, + "mean_token_accuracy": 0.7249775469303131, + "num_tokens": 8698077.0, + "step": 3760 + }, + { + "epoch": 0.03456495828367104, + "learning_rate": 0.0001930888420280554, + "loss": 0.9275, + "mean_token_accuracy": 0.729182767868042, + "num_tokens": 8720532.0, + "step": 3770 + }, + { + "epoch": 0.03465664252315027, + "learning_rate": 0.00019307050518015955, + "loss": 0.9447, + "mean_token_accuracy": 0.7250973403453826, + "num_tokens": 8744014.0, + "step": 3780 + }, + { + "epoch": 0.034748326762629504, + "learning_rate": 0.0001930521683322637, + "loss": 0.9265, + "mean_token_accuracy": 0.7238422811031342, + "num_tokens": 8766595.0, + "step": 3790 + }, + { + "epoch": 0.03484001100210874, + "learning_rate": 0.00019303383148436786, + "loss": 0.9248, + "mean_token_accuracy": 0.7350191116333008, + "num_tokens": 8790233.0, + "step": 3800 + }, + { + "epoch": 0.03493169524158797, + "learning_rate": 0.000193015494636472, + "loss": 0.95, + "mean_token_accuracy": 0.7251366436481476, + "num_tokens": 8813193.0, + "step": 3810 + }, + { + "epoch": 0.03502337948106721, + "learning_rate": 0.00019299715778857613, + "loss": 0.9388, + "mean_token_accuracy": 0.7282186210155487, + "num_tokens": 8835927.0, + "step": 3820 + }, + { + "epoch": 0.03511506372054644, + "learning_rate": 0.00019297882094068032, + "loss": 0.9124, + "mean_token_accuracy": 0.7330652952194214, + "num_tokens": 8859275.0, + "step": 3830 + }, + { + "epoch": 0.035206747960025674, + "learning_rate": 0.00019296048409278446, + "loss": 0.9275, + "mean_token_accuracy": 0.7347700655460357, + "num_tokens": 8883352.0, + "step": 3840 + }, + { + "epoch": 0.0352984321995049, + "learning_rate": 0.00019294214724488863, + "loss": 0.9137, + "mean_token_accuracy": 0.7327137053012848, + "num_tokens": 8906655.0, + "step": 3850 + }, + { + "epoch": 0.03539011643898414, + "learning_rate": 0.00019292381039699277, + "loss": 0.9246, + "mean_token_accuracy": 0.7234176814556121, + "num_tokens": 8929167.0, + "step": 3860 + }, + { + "epoch": 0.03548180067846337, + "learning_rate": 0.0001929054735490969, + "loss": 0.9326, + "mean_token_accuracy": 0.7283679842948914, + "num_tokens": 8952692.0, + "step": 3870 + }, + { + "epoch": 0.035573484917942606, + "learning_rate": 0.00019288713670120107, + "loss": 0.9383, + "mean_token_accuracy": 0.7266233503818512, + "num_tokens": 8976287.0, + "step": 3880 + }, + { + "epoch": 0.035665169157421836, + "learning_rate": 0.0001928687998533052, + "loss": 0.888, + "mean_token_accuracy": 0.7429258465766907, + "num_tokens": 9001139.0, + "step": 3890 + }, + { + "epoch": 0.03575685339690107, + "learning_rate": 0.00019285046300540937, + "loss": 0.9509, + "mean_token_accuracy": 0.7248917520046234, + "num_tokens": 9024293.0, + "step": 3900 + }, + { + "epoch": 0.03584853763638031, + "learning_rate": 0.00019283212615751354, + "loss": 0.8998, + "mean_token_accuracy": 0.7370175182819366, + "num_tokens": 9048108.0, + "step": 3910 + }, + { + "epoch": 0.03594022187585954, + "learning_rate": 0.00019281378930961768, + "loss": 0.9311, + "mean_token_accuracy": 0.7286861360073089, + "num_tokens": 9071283.0, + "step": 3920 + }, + { + "epoch": 0.036031906115338776, + "learning_rate": 0.00019279545246172184, + "loss": 0.8983, + "mean_token_accuracy": 0.7360428929328918, + "num_tokens": 9094154.0, + "step": 3930 + }, + { + "epoch": 0.036123590354818005, + "learning_rate": 0.00019277711561382598, + "loss": 0.9033, + "mean_token_accuracy": 0.7331046104431153, + "num_tokens": 9116850.0, + "step": 3940 + }, + { + "epoch": 0.03621527459429724, + "learning_rate": 0.00019275877876593015, + "loss": 0.9409, + "mean_token_accuracy": 0.7291643500328064, + "num_tokens": 9140874.0, + "step": 3950 + }, + { + "epoch": 0.03630695883377647, + "learning_rate": 0.0001927404419180343, + "loss": 0.9208, + "mean_token_accuracy": 0.7249537229537963, + "num_tokens": 9164480.0, + "step": 3960 + }, + { + "epoch": 0.03639864307325571, + "learning_rate": 0.00019272210507013845, + "loss": 0.9405, + "mean_token_accuracy": 0.7252800822257995, + "num_tokens": 9187966.0, + "step": 3970 + }, + { + "epoch": 0.03649032731273494, + "learning_rate": 0.00019270376822224262, + "loss": 0.9088, + "mean_token_accuracy": 0.7344141483306885, + "num_tokens": 9210424.0, + "step": 3980 + }, + { + "epoch": 0.036582011552214175, + "learning_rate": 0.00019268543137434675, + "loss": 0.9366, + "mean_token_accuracy": 0.7268620252609252, + "num_tokens": 9233443.0, + "step": 3990 + }, + { + "epoch": 0.036673695791693404, + "learning_rate": 0.00019266709452645092, + "loss": 0.9438, + "mean_token_accuracy": 0.7300260365009308, + "num_tokens": 9255951.0, + "step": 4000 + }, + { + "epoch": 0.03676538003117264, + "learning_rate": 0.00019264875767855506, + "loss": 0.906, + "mean_token_accuracy": 0.7370599687099457, + "num_tokens": 9279251.0, + "step": 4010 + }, + { + "epoch": 0.03685706427065188, + "learning_rate": 0.0001926304208306592, + "loss": 0.9123, + "mean_token_accuracy": 0.7281017899513245, + "num_tokens": 9303004.0, + "step": 4020 + }, + { + "epoch": 0.03694874851013111, + "learning_rate": 0.0001926120839827634, + "loss": 0.9501, + "mean_token_accuracy": 0.7276595234870911, + "num_tokens": 9325422.0, + "step": 4030 + }, + { + "epoch": 0.037040432749610344, + "learning_rate": 0.00019259374713486753, + "loss": 0.9224, + "mean_token_accuracy": 0.7300042688846589, + "num_tokens": 9348725.0, + "step": 4040 + }, + { + "epoch": 0.037132116989089574, + "learning_rate": 0.0001925754102869717, + "loss": 0.9135, + "mean_token_accuracy": 0.7325215935707092, + "num_tokens": 9372069.0, + "step": 4050 + }, + { + "epoch": 0.03722380122856881, + "learning_rate": 0.00019255707343907583, + "loss": 0.9213, + "mean_token_accuracy": 0.7293917417526246, + "num_tokens": 9394823.0, + "step": 4060 + }, + { + "epoch": 0.03731548546804804, + "learning_rate": 0.00019253873659117997, + "loss": 0.8938, + "mean_token_accuracy": 0.7401670753955841, + "num_tokens": 9417990.0, + "step": 4070 + }, + { + "epoch": 0.03740716970752728, + "learning_rate": 0.00019252039974328414, + "loss": 0.9218, + "mean_token_accuracy": 0.7370520889759063, + "num_tokens": 9441655.0, + "step": 4080 + }, + { + "epoch": 0.03749885394700651, + "learning_rate": 0.0001925020628953883, + "loss": 0.9203, + "mean_token_accuracy": 0.7329012930393219, + "num_tokens": 9464852.0, + "step": 4090 + }, + { + "epoch": 0.03759053818648574, + "learning_rate": 0.00019248372604749244, + "loss": 0.9245, + "mean_token_accuracy": 0.7307345628738403, + "num_tokens": 9488579.0, + "step": 4100 + }, + { + "epoch": 0.03768222242596498, + "learning_rate": 0.0001924653891995966, + "loss": 0.9244, + "mean_token_accuracy": 0.7316778898239136, + "num_tokens": 9512651.0, + "step": 4110 + }, + { + "epoch": 0.03777390666544421, + "learning_rate": 0.00019244705235170074, + "loss": 0.9031, + "mean_token_accuracy": 0.7334048569202423, + "num_tokens": 9535376.0, + "step": 4120 + }, + { + "epoch": 0.037865590904923446, + "learning_rate": 0.0001924287155038049, + "loss": 0.9133, + "mean_token_accuracy": 0.7282979667186738, + "num_tokens": 9558779.0, + "step": 4130 + }, + { + "epoch": 0.037957275144402676, + "learning_rate": 0.00019241037865590905, + "loss": 0.9576, + "mean_token_accuracy": 0.7185169041156769, + "num_tokens": 9581924.0, + "step": 4140 + }, + { + "epoch": 0.03804895938388191, + "learning_rate": 0.0001923920418080132, + "loss": 0.8996, + "mean_token_accuracy": 0.7348777174949646, + "num_tokens": 9604941.0, + "step": 4150 + }, + { + "epoch": 0.03814064362336114, + "learning_rate": 0.00019237370496011738, + "loss": 0.9546, + "mean_token_accuracy": 0.7209603607654571, + "num_tokens": 9628525.0, + "step": 4160 + }, + { + "epoch": 0.03823232786284038, + "learning_rate": 0.00019235536811222152, + "loss": 0.9247, + "mean_token_accuracy": 0.7281001746654511, + "num_tokens": 9652060.0, + "step": 4170 + }, + { + "epoch": 0.03832401210231961, + "learning_rate": 0.00019233703126432568, + "loss": 0.9508, + "mean_token_accuracy": 0.7243199825286866, + "num_tokens": 9674742.0, + "step": 4180 + }, + { + "epoch": 0.038415696341798845, + "learning_rate": 0.00019231869441642982, + "loss": 0.903, + "mean_token_accuracy": 0.7305576920509338, + "num_tokens": 9698353.0, + "step": 4190 + }, + { + "epoch": 0.038507380581278075, + "learning_rate": 0.00019230035756853398, + "loss": 0.8963, + "mean_token_accuracy": 0.7371667623519897, + "num_tokens": 9720928.0, + "step": 4200 + }, + { + "epoch": 0.03859906482075731, + "learning_rate": 0.00019228202072063812, + "loss": 0.9727, + "mean_token_accuracy": 0.7168154358863831, + "num_tokens": 9743613.0, + "step": 4210 + }, + { + "epoch": 0.03869074906023655, + "learning_rate": 0.0001922636838727423, + "loss": 0.8997, + "mean_token_accuracy": 0.7314011812210083, + "num_tokens": 9766340.0, + "step": 4220 + }, + { + "epoch": 0.03878243329971578, + "learning_rate": 0.00019224534702484645, + "loss": 0.9387, + "mean_token_accuracy": 0.7212896049022675, + "num_tokens": 9789134.0, + "step": 4230 + }, + { + "epoch": 0.038874117539195015, + "learning_rate": 0.0001922270101769506, + "loss": 0.9679, + "mean_token_accuracy": 0.7234770894050598, + "num_tokens": 9812019.0, + "step": 4240 + }, + { + "epoch": 0.038965801778674244, + "learning_rate": 0.00019220867332905476, + "loss": 0.9112, + "mean_token_accuracy": 0.7349667072296142, + "num_tokens": 9835484.0, + "step": 4250 + }, + { + "epoch": 0.03905748601815348, + "learning_rate": 0.0001921903364811589, + "loss": 0.906, + "mean_token_accuracy": 0.7317733287811279, + "num_tokens": 9858660.0, + "step": 4260 + }, + { + "epoch": 0.03914917025763271, + "learning_rate": 0.00019217199963326303, + "loss": 0.9464, + "mean_token_accuracy": 0.7197532892227173, + "num_tokens": 9881340.0, + "step": 4270 + }, + { + "epoch": 0.03924085449711195, + "learning_rate": 0.0001921536627853672, + "loss": 0.8831, + "mean_token_accuracy": 0.7415769517421722, + "num_tokens": 9904520.0, + "step": 4280 + }, + { + "epoch": 0.03933253873659118, + "learning_rate": 0.00019213532593747136, + "loss": 0.9393, + "mean_token_accuracy": 0.7288309633731842, + "num_tokens": 9927905.0, + "step": 4290 + }, + { + "epoch": 0.039424222976070414, + "learning_rate": 0.0001921169890895755, + "loss": 0.9101, + "mean_token_accuracy": 0.7318473041057587, + "num_tokens": 9951267.0, + "step": 4300 + }, + { + "epoch": 0.03951590721554965, + "learning_rate": 0.00019209865224167967, + "loss": 0.9621, + "mean_token_accuracy": 0.724247795343399, + "num_tokens": 9974399.0, + "step": 4310 + }, + { + "epoch": 0.03960759145502888, + "learning_rate": 0.0001920803153937838, + "loss": 0.9643, + "mean_token_accuracy": 0.7237609922885895, + "num_tokens": 9998102.0, + "step": 4320 + }, + { + "epoch": 0.03969927569450812, + "learning_rate": 0.00019206197854588797, + "loss": 0.9104, + "mean_token_accuracy": 0.7343532621860505, + "num_tokens": 10020895.0, + "step": 4330 + }, + { + "epoch": 0.03979095993398735, + "learning_rate": 0.0001920436416979921, + "loss": 0.9486, + "mean_token_accuracy": 0.7267881989479065, + "num_tokens": 10044334.0, + "step": 4340 + }, + { + "epoch": 0.03988264417346658, + "learning_rate": 0.00019202530485009628, + "loss": 0.9248, + "mean_token_accuracy": 0.732563316822052, + "num_tokens": 10067261.0, + "step": 4350 + }, + { + "epoch": 0.03997432841294581, + "learning_rate": 0.00019200696800220044, + "loss": 0.9232, + "mean_token_accuracy": 0.729229062795639, + "num_tokens": 10091244.0, + "step": 4360 + }, + { + "epoch": 0.04006601265242505, + "learning_rate": 0.00019198863115430458, + "loss": 0.9276, + "mean_token_accuracy": 0.7269666433334351, + "num_tokens": 10114219.0, + "step": 4370 + }, + { + "epoch": 0.04015769689190428, + "learning_rate": 0.00019197029430640875, + "loss": 0.9053, + "mean_token_accuracy": 0.7333428621292114, + "num_tokens": 10136903.0, + "step": 4380 + }, + { + "epoch": 0.040249381131383516, + "learning_rate": 0.00019195195745851288, + "loss": 0.8858, + "mean_token_accuracy": 0.7340048730373383, + "num_tokens": 10159936.0, + "step": 4390 + }, + { + "epoch": 0.040341065370862746, + "learning_rate": 0.00019193362061061705, + "loss": 0.9274, + "mean_token_accuracy": 0.7230561375617981, + "num_tokens": 10182391.0, + "step": 4400 + }, + { + "epoch": 0.04043274961034198, + "learning_rate": 0.0001919152837627212, + "loss": 0.9443, + "mean_token_accuracy": 0.7281116962432861, + "num_tokens": 10204517.0, + "step": 4410 + }, + { + "epoch": 0.04052443384982122, + "learning_rate": 0.00019189694691482535, + "loss": 0.9196, + "mean_token_accuracy": 0.7343146979808808, + "num_tokens": 10228254.0, + "step": 4420 + }, + { + "epoch": 0.04061611808930045, + "learning_rate": 0.00019187861006692952, + "loss": 0.925, + "mean_token_accuracy": 0.7307032346725464, + "num_tokens": 10251253.0, + "step": 4430 + }, + { + "epoch": 0.040707802328779685, + "learning_rate": 0.00019186027321903366, + "loss": 0.9239, + "mean_token_accuracy": 0.7301364064216613, + "num_tokens": 10274680.0, + "step": 4440 + }, + { + "epoch": 0.040799486568258915, + "learning_rate": 0.00019184193637113782, + "loss": 0.9009, + "mean_token_accuracy": 0.7370919942855835, + "num_tokens": 10297380.0, + "step": 4450 + }, + { + "epoch": 0.04089117080773815, + "learning_rate": 0.00019182359952324196, + "loss": 0.9127, + "mean_token_accuracy": 0.7353456616401672, + "num_tokens": 10320125.0, + "step": 4460 + }, + { + "epoch": 0.04098285504721738, + "learning_rate": 0.0001918052626753461, + "loss": 0.9246, + "mean_token_accuracy": 0.727199786901474, + "num_tokens": 10342990.0, + "step": 4470 + }, + { + "epoch": 0.04107453928669662, + "learning_rate": 0.0001917869258274503, + "loss": 0.9192, + "mean_token_accuracy": 0.7290555357933044, + "num_tokens": 10367321.0, + "step": 4480 + }, + { + "epoch": 0.04116622352617585, + "learning_rate": 0.00019176858897955443, + "loss": 0.9051, + "mean_token_accuracy": 0.7330770313739776, + "num_tokens": 10390203.0, + "step": 4490 + }, + { + "epoch": 0.041257907765655084, + "learning_rate": 0.00019175025213165857, + "loss": 0.8645, + "mean_token_accuracy": 0.7316236853599548, + "num_tokens": 10413697.0, + "step": 4500 + }, + { + "epoch": 0.041349592005134314, + "learning_rate": 0.00019173191528376273, + "loss": 0.9472, + "mean_token_accuracy": 0.7224329710006714, + "num_tokens": 10437138.0, + "step": 4510 + }, + { + "epoch": 0.04144127624461355, + "learning_rate": 0.00019171357843586687, + "loss": 0.9147, + "mean_token_accuracy": 0.7303707957267761, + "num_tokens": 10460102.0, + "step": 4520 + }, + { + "epoch": 0.04153296048409279, + "learning_rate": 0.00019169524158797104, + "loss": 0.9283, + "mean_token_accuracy": 0.7304834306240082, + "num_tokens": 10483933.0, + "step": 4530 + }, + { + "epoch": 0.04162464472357202, + "learning_rate": 0.00019167690474007518, + "loss": 0.9127, + "mean_token_accuracy": 0.7311757445335388, + "num_tokens": 10507204.0, + "step": 4540 + }, + { + "epoch": 0.041716328963051254, + "learning_rate": 0.00019165856789217934, + "loss": 0.9085, + "mean_token_accuracy": 0.7350265562534333, + "num_tokens": 10530801.0, + "step": 4550 + }, + { + "epoch": 0.041808013202530483, + "learning_rate": 0.0001916402310442835, + "loss": 0.8878, + "mean_token_accuracy": 0.7378389596939087, + "num_tokens": 10553989.0, + "step": 4560 + }, + { + "epoch": 0.04189969744200972, + "learning_rate": 0.00019162189419638764, + "loss": 0.884, + "mean_token_accuracy": 0.734668105840683, + "num_tokens": 10577138.0, + "step": 4570 + }, + { + "epoch": 0.04199138168148895, + "learning_rate": 0.0001916035573484918, + "loss": 0.8842, + "mean_token_accuracy": 0.7381771743297577, + "num_tokens": 10601297.0, + "step": 4580 + }, + { + "epoch": 0.042083065920968186, + "learning_rate": 0.00019158522050059595, + "loss": 0.9061, + "mean_token_accuracy": 0.7319147646427154, + "num_tokens": 10624206.0, + "step": 4590 + }, + { + "epoch": 0.042174750160447416, + "learning_rate": 0.0001915668836527001, + "loss": 0.8852, + "mean_token_accuracy": 0.7353412926197052, + "num_tokens": 10648182.0, + "step": 4600 + }, + { + "epoch": 0.04226643439992665, + "learning_rate": 0.00019154854680480428, + "loss": 0.9555, + "mean_token_accuracy": 0.7207437753677368, + "num_tokens": 10670133.0, + "step": 4610 + }, + { + "epoch": 0.04235811863940589, + "learning_rate": 0.00019153020995690842, + "loss": 0.9053, + "mean_token_accuracy": 0.7397615969181061, + "num_tokens": 10693264.0, + "step": 4620 + }, + { + "epoch": 0.04244980287888512, + "learning_rate": 0.00019151187310901258, + "loss": 0.9227, + "mean_token_accuracy": 0.7346453845500946, + "num_tokens": 10715885.0, + "step": 4630 + }, + { + "epoch": 0.042541487118364356, + "learning_rate": 0.00019149353626111672, + "loss": 0.8899, + "mean_token_accuracy": 0.7341054856777192, + "num_tokens": 10739445.0, + "step": 4640 + }, + { + "epoch": 0.042633171357843586, + "learning_rate": 0.00019147519941322089, + "loss": 0.9314, + "mean_token_accuracy": 0.7296093761920929, + "num_tokens": 10761786.0, + "step": 4650 + }, + { + "epoch": 0.04272485559732282, + "learning_rate": 0.00019145686256532502, + "loss": 0.9078, + "mean_token_accuracy": 0.7359691679477691, + "num_tokens": 10784647.0, + "step": 4660 + }, + { + "epoch": 0.04281653983680205, + "learning_rate": 0.00019143852571742916, + "loss": 0.9195, + "mean_token_accuracy": 0.7348001301288605, + "num_tokens": 10808385.0, + "step": 4670 + }, + { + "epoch": 0.04290822407628129, + "learning_rate": 0.00019142018886953336, + "loss": 0.8954, + "mean_token_accuracy": 0.7353730797767639, + "num_tokens": 10831964.0, + "step": 4680 + }, + { + "epoch": 0.04299990831576052, + "learning_rate": 0.0001914018520216375, + "loss": 0.9343, + "mean_token_accuracy": 0.7262511432170868, + "num_tokens": 10855313.0, + "step": 4690 + }, + { + "epoch": 0.043091592555239755, + "learning_rate": 0.00019138351517374163, + "loss": 0.9107, + "mean_token_accuracy": 0.7381054639816285, + "num_tokens": 10878614.0, + "step": 4700 + }, + { + "epoch": 0.043183276794718985, + "learning_rate": 0.0001913651783258458, + "loss": 0.9033, + "mean_token_accuracy": 0.7366665303707123, + "num_tokens": 10901215.0, + "step": 4710 + }, + { + "epoch": 0.04327496103419822, + "learning_rate": 0.00019134684147794994, + "loss": 0.9308, + "mean_token_accuracy": 0.7277913689613342, + "num_tokens": 10923953.0, + "step": 4720 + }, + { + "epoch": 0.04336664527367746, + "learning_rate": 0.0001913285046300541, + "loss": 0.9264, + "mean_token_accuracy": 0.7296841561794281, + "num_tokens": 10947865.0, + "step": 4730 + }, + { + "epoch": 0.04345832951315669, + "learning_rate": 0.00019131016778215827, + "loss": 0.8988, + "mean_token_accuracy": 0.7380661249160767, + "num_tokens": 10970854.0, + "step": 4740 + }, + { + "epoch": 0.043550013752635924, + "learning_rate": 0.0001912918309342624, + "loss": 0.9156, + "mean_token_accuracy": 0.7335442006587982, + "num_tokens": 10994578.0, + "step": 4750 + }, + { + "epoch": 0.043641697992115154, + "learning_rate": 0.00019127349408636657, + "loss": 0.9366, + "mean_token_accuracy": 0.7311666131019592, + "num_tokens": 11018190.0, + "step": 4760 + }, + { + "epoch": 0.04373338223159439, + "learning_rate": 0.0001912551572384707, + "loss": 0.8864, + "mean_token_accuracy": 0.7349504888057709, + "num_tokens": 11040756.0, + "step": 4770 + }, + { + "epoch": 0.04382506647107362, + "learning_rate": 0.00019123682039057487, + "loss": 0.9226, + "mean_token_accuracy": 0.7343326091766358, + "num_tokens": 11064224.0, + "step": 4780 + }, + { + "epoch": 0.04391675071055286, + "learning_rate": 0.000191218483542679, + "loss": 0.9116, + "mean_token_accuracy": 0.7310377061367035, + "num_tokens": 11088507.0, + "step": 4790 + }, + { + "epoch": 0.04400843495003209, + "learning_rate": 0.00019120014669478318, + "loss": 0.9202, + "mean_token_accuracy": 0.7256883978843689, + "num_tokens": 11111192.0, + "step": 4800 + }, + { + "epoch": 0.04410011918951132, + "learning_rate": 0.00019118180984688734, + "loss": 0.9189, + "mean_token_accuracy": 0.737100613117218, + "num_tokens": 11134725.0, + "step": 4810 + }, + { + "epoch": 0.04419180342899055, + "learning_rate": 0.00019116347299899148, + "loss": 0.9303, + "mean_token_accuracy": 0.7256133377552032, + "num_tokens": 11158174.0, + "step": 4820 + }, + { + "epoch": 0.04428348766846979, + "learning_rate": 0.00019114513615109565, + "loss": 0.8911, + "mean_token_accuracy": 0.7342537999153137, + "num_tokens": 11181872.0, + "step": 4830 + }, + { + "epoch": 0.044375171907949026, + "learning_rate": 0.00019112679930319979, + "loss": 0.8922, + "mean_token_accuracy": 0.7380224943161011, + "num_tokens": 11205167.0, + "step": 4840 + }, + { + "epoch": 0.044466856147428256, + "learning_rate": 0.00019110846245530395, + "loss": 0.9255, + "mean_token_accuracy": 0.7311283588409424, + "num_tokens": 11228416.0, + "step": 4850 + }, + { + "epoch": 0.04455854038690749, + "learning_rate": 0.0001910901256074081, + "loss": 0.8655, + "mean_token_accuracy": 0.7448768377304077, + "num_tokens": 11252013.0, + "step": 4860 + }, + { + "epoch": 0.04465022462638672, + "learning_rate": 0.00019107178875951223, + "loss": 0.9079, + "mean_token_accuracy": 0.7323541164398193, + "num_tokens": 11275455.0, + "step": 4870 + }, + { + "epoch": 0.04474190886586596, + "learning_rate": 0.00019105345191161642, + "loss": 0.8912, + "mean_token_accuracy": 0.7325319647789001, + "num_tokens": 11298923.0, + "step": 4880 + }, + { + "epoch": 0.04483359310534519, + "learning_rate": 0.00019103511506372056, + "loss": 0.8714, + "mean_token_accuracy": 0.7456724584102631, + "num_tokens": 11321675.0, + "step": 4890 + }, + { + "epoch": 0.044925277344824426, + "learning_rate": 0.0001910167782158247, + "loss": 0.8966, + "mean_token_accuracy": 0.732540625333786, + "num_tokens": 11344222.0, + "step": 4900 + }, + { + "epoch": 0.045016961584303655, + "learning_rate": 0.00019099844136792886, + "loss": 0.9664, + "mean_token_accuracy": 0.7202228009700775, + "num_tokens": 11367101.0, + "step": 4910 + }, + { + "epoch": 0.04510864582378289, + "learning_rate": 0.000190980104520033, + "loss": 0.9181, + "mean_token_accuracy": 0.7350785553455352, + "num_tokens": 11390164.0, + "step": 4920 + }, + { + "epoch": 0.04520033006326213, + "learning_rate": 0.00019096176767213717, + "loss": 0.8982, + "mean_token_accuracy": 0.7460702061653137, + "num_tokens": 11413866.0, + "step": 4930 + }, + { + "epoch": 0.04529201430274136, + "learning_rate": 0.00019094343082424133, + "loss": 0.9133, + "mean_token_accuracy": 0.7296039283275604, + "num_tokens": 11437073.0, + "step": 4940 + }, + { + "epoch": 0.045383698542220595, + "learning_rate": 0.00019092509397634547, + "loss": 0.9185, + "mean_token_accuracy": 0.7308907270431518, + "num_tokens": 11460639.0, + "step": 4950 + }, + { + "epoch": 0.045475382781699825, + "learning_rate": 0.00019090675712844963, + "loss": 0.9383, + "mean_token_accuracy": 0.7259656071662903, + "num_tokens": 11484530.0, + "step": 4960 + }, + { + "epoch": 0.04556706702117906, + "learning_rate": 0.00019088842028055377, + "loss": 0.909, + "mean_token_accuracy": 0.7335390865802764, + "num_tokens": 11508137.0, + "step": 4970 + }, + { + "epoch": 0.04565875126065829, + "learning_rate": 0.00019087008343265794, + "loss": 0.8711, + "mean_token_accuracy": 0.740622091293335, + "num_tokens": 11531716.0, + "step": 4980 + }, + { + "epoch": 0.04575043550013753, + "learning_rate": 0.00019085174658476208, + "loss": 0.8933, + "mean_token_accuracy": 0.7343130946159363, + "num_tokens": 11554888.0, + "step": 4990 + }, + { + "epoch": 0.04584211973961676, + "learning_rate": 0.00019083340973686624, + "loss": 0.8836, + "mean_token_accuracy": 0.7344820499420166, + "num_tokens": 11578097.0, + "step": 5000 + }, + { + "epoch": 0.045933803979095994, + "learning_rate": 0.0001908150728889704, + "loss": 0.9201, + "mean_token_accuracy": 0.7351269721984863, + "num_tokens": 11601339.0, + "step": 5010 + }, + { + "epoch": 0.046025488218575224, + "learning_rate": 0.00019079673604107455, + "loss": 0.8898, + "mean_token_accuracy": 0.7382785975933075, + "num_tokens": 11623472.0, + "step": 5020 + }, + { + "epoch": 0.04611717245805446, + "learning_rate": 0.0001907783991931787, + "loss": 0.9112, + "mean_token_accuracy": 0.7351314783096313, + "num_tokens": 11645914.0, + "step": 5030 + }, + { + "epoch": 0.0462088566975337, + "learning_rate": 0.00019076006234528285, + "loss": 0.8596, + "mean_token_accuracy": 0.7480172634124755, + "num_tokens": 11669016.0, + "step": 5040 + }, + { + "epoch": 0.04630054093701293, + "learning_rate": 0.00019074172549738702, + "loss": 0.9295, + "mean_token_accuracy": 0.7314546644687653, + "num_tokens": 11692104.0, + "step": 5050 + }, + { + "epoch": 0.04639222517649216, + "learning_rate": 0.00019072338864949115, + "loss": 0.9463, + "mean_token_accuracy": 0.7246203124523163, + "num_tokens": 11715266.0, + "step": 5060 + }, + { + "epoch": 0.04648390941597139, + "learning_rate": 0.00019070505180159532, + "loss": 0.941, + "mean_token_accuracy": 0.7293759286403656, + "num_tokens": 11738485.0, + "step": 5070 + }, + { + "epoch": 0.04657559365545063, + "learning_rate": 0.00019068671495369948, + "loss": 0.9232, + "mean_token_accuracy": 0.7281923830509186, + "num_tokens": 11762529.0, + "step": 5080 + }, + { + "epoch": 0.04666727789492986, + "learning_rate": 0.00019066837810580362, + "loss": 0.8803, + "mean_token_accuracy": 0.735435402393341, + "num_tokens": 11784620.0, + "step": 5090 + }, + { + "epoch": 0.046758962134409096, + "learning_rate": 0.00019065004125790776, + "loss": 0.9113, + "mean_token_accuracy": 0.7347549855709076, + "num_tokens": 11807447.0, + "step": 5100 + }, + { + "epoch": 0.046850646373888326, + "learning_rate": 0.00019063170441001193, + "loss": 0.8987, + "mean_token_accuracy": 0.7351148843765258, + "num_tokens": 11830174.0, + "step": 5110 + }, + { + "epoch": 0.04694233061336756, + "learning_rate": 0.00019061336756211606, + "loss": 0.9323, + "mean_token_accuracy": 0.7337264120578766, + "num_tokens": 11852919.0, + "step": 5120 + }, + { + "epoch": 0.04703401485284679, + "learning_rate": 0.00019059503071422023, + "loss": 0.917, + "mean_token_accuracy": 0.7345613598823547, + "num_tokens": 11875515.0, + "step": 5130 + }, + { + "epoch": 0.04712569909232603, + "learning_rate": 0.0001905766938663244, + "loss": 0.9532, + "mean_token_accuracy": 0.7227387726306915, + "num_tokens": 11898333.0, + "step": 5140 + }, + { + "epoch": 0.047217383331805265, + "learning_rate": 0.00019055835701842853, + "loss": 0.9127, + "mean_token_accuracy": 0.7374009609222412, + "num_tokens": 11921640.0, + "step": 5150 + }, + { + "epoch": 0.047309067571284495, + "learning_rate": 0.0001905400201705327, + "loss": 0.9097, + "mean_token_accuracy": 0.7349705874919892, + "num_tokens": 11945069.0, + "step": 5160 + }, + { + "epoch": 0.04740075181076373, + "learning_rate": 0.00019052168332263684, + "loss": 0.904, + "mean_token_accuracy": 0.7365436136722565, + "num_tokens": 11968865.0, + "step": 5170 + }, + { + "epoch": 0.04749243605024296, + "learning_rate": 0.000190503346474741, + "loss": 0.9122, + "mean_token_accuracy": 0.7329197347164154, + "num_tokens": 11991891.0, + "step": 5180 + }, + { + "epoch": 0.0475841202897222, + "learning_rate": 0.00019048500962684514, + "loss": 0.8986, + "mean_token_accuracy": 0.7397706091403962, + "num_tokens": 12014467.0, + "step": 5190 + }, + { + "epoch": 0.04767580452920143, + "learning_rate": 0.0001904666727789493, + "loss": 0.8919, + "mean_token_accuracy": 0.7435442924499511, + "num_tokens": 12037783.0, + "step": 5200 + }, + { + "epoch": 0.047767488768680665, + "learning_rate": 0.00019044833593105347, + "loss": 0.8918, + "mean_token_accuracy": 0.7346071600914001, + "num_tokens": 12060304.0, + "step": 5210 + }, + { + "epoch": 0.047859173008159894, + "learning_rate": 0.0001904299990831576, + "loss": 0.9051, + "mean_token_accuracy": 0.7371912002563477, + "num_tokens": 12083174.0, + "step": 5220 + }, + { + "epoch": 0.04795085724763913, + "learning_rate": 0.00019041166223526178, + "loss": 0.8998, + "mean_token_accuracy": 0.7349052250385284, + "num_tokens": 12106308.0, + "step": 5230 + }, + { + "epoch": 0.04804254148711837, + "learning_rate": 0.00019039332538736591, + "loss": 0.9604, + "mean_token_accuracy": 0.7219788312911988, + "num_tokens": 12129160.0, + "step": 5240 + }, + { + "epoch": 0.0481342257265976, + "learning_rate": 0.00019037498853947008, + "loss": 0.9377, + "mean_token_accuracy": 0.7283720731735229, + "num_tokens": 12152124.0, + "step": 5250 + }, + { + "epoch": 0.048225909966076834, + "learning_rate": 0.00019035665169157422, + "loss": 0.945, + "mean_token_accuracy": 0.7313692808151245, + "num_tokens": 12175087.0, + "step": 5260 + }, + { + "epoch": 0.048317594205556064, + "learning_rate": 0.00019033831484367838, + "loss": 0.909, + "mean_token_accuracy": 0.7319585144519806, + "num_tokens": 12197643.0, + "step": 5270 + }, + { + "epoch": 0.0484092784450353, + "learning_rate": 0.00019031997799578255, + "loss": 0.9346, + "mean_token_accuracy": 0.7274428248405457, + "num_tokens": 12220518.0, + "step": 5280 + }, + { + "epoch": 0.04850096268451453, + "learning_rate": 0.0001903016411478867, + "loss": 0.8683, + "mean_token_accuracy": 0.745925348997116, + "num_tokens": 12244221.0, + "step": 5290 + }, + { + "epoch": 0.04859264692399377, + "learning_rate": 0.00019028330429999083, + "loss": 0.9096, + "mean_token_accuracy": 0.7328312158584595, + "num_tokens": 12267036.0, + "step": 5300 + }, + { + "epoch": 0.048684331163472996, + "learning_rate": 0.000190264967452095, + "loss": 0.9198, + "mean_token_accuracy": 0.7322596430778503, + "num_tokens": 12290136.0, + "step": 5310 + }, + { + "epoch": 0.04877601540295223, + "learning_rate": 0.00019024663060419913, + "loss": 0.8922, + "mean_token_accuracy": 0.7314849436283112, + "num_tokens": 12312714.0, + "step": 5320 + }, + { + "epoch": 0.04886769964243146, + "learning_rate": 0.00019022829375630332, + "loss": 0.8543, + "mean_token_accuracy": 0.7430943608283996, + "num_tokens": 12336333.0, + "step": 5330 + }, + { + "epoch": 0.0489593838819107, + "learning_rate": 0.00019020995690840746, + "loss": 0.8905, + "mean_token_accuracy": 0.7302204668521881, + "num_tokens": 12358377.0, + "step": 5340 + }, + { + "epoch": 0.049051068121389936, + "learning_rate": 0.0001901916200605116, + "loss": 0.918, + "mean_token_accuracy": 0.7341718196868896, + "num_tokens": 12381783.0, + "step": 5350 + }, + { + "epoch": 0.049142752360869166, + "learning_rate": 0.00019017328321261576, + "loss": 0.8849, + "mean_token_accuracy": 0.7394325435161591, + "num_tokens": 12404907.0, + "step": 5360 + }, + { + "epoch": 0.0492344366003484, + "learning_rate": 0.0001901549463647199, + "loss": 0.9342, + "mean_token_accuracy": 0.7280310750007629, + "num_tokens": 12428138.0, + "step": 5370 + }, + { + "epoch": 0.04932612083982763, + "learning_rate": 0.00019013660951682407, + "loss": 0.9071, + "mean_token_accuracy": 0.7335152506828309, + "num_tokens": 12452551.0, + "step": 5380 + }, + { + "epoch": 0.04941780507930687, + "learning_rate": 0.0001901182726689282, + "loss": 0.8968, + "mean_token_accuracy": 0.7261455655097961, + "num_tokens": 12476343.0, + "step": 5390 + }, + { + "epoch": 0.0495094893187861, + "learning_rate": 0.00019009993582103237, + "loss": 0.9005, + "mean_token_accuracy": 0.7367361962795258, + "num_tokens": 12499385.0, + "step": 5400 + }, + { + "epoch": 0.049601173558265335, + "learning_rate": 0.00019008159897313654, + "loss": 0.9273, + "mean_token_accuracy": 0.7294711172580719, + "num_tokens": 12523284.0, + "step": 5410 + }, + { + "epoch": 0.049692857797744565, + "learning_rate": 0.00019006326212524067, + "loss": 0.9013, + "mean_token_accuracy": 0.7319343149662018, + "num_tokens": 12547085.0, + "step": 5420 + }, + { + "epoch": 0.0497845420372238, + "learning_rate": 0.00019004492527734484, + "loss": 0.8736, + "mean_token_accuracy": 0.7341129004955291, + "num_tokens": 12569829.0, + "step": 5430 + }, + { + "epoch": 0.04987622627670304, + "learning_rate": 0.00019002658842944898, + "loss": 0.9254, + "mean_token_accuracy": 0.7253397226333618, + "num_tokens": 12592456.0, + "step": 5440 + }, + { + "epoch": 0.04996791051618227, + "learning_rate": 0.00019000825158155314, + "loss": 0.9164, + "mean_token_accuracy": 0.733900386095047, + "num_tokens": 12614992.0, + "step": 5450 + }, + { + "epoch": 0.050059594755661505, + "learning_rate": 0.0001899899147336573, + "loss": 0.8818, + "mean_token_accuracy": 0.7450060486793518, + "num_tokens": 12638048.0, + "step": 5460 + }, + { + "epoch": 0.050151278995140734, + "learning_rate": 0.00018997157788576145, + "loss": 0.9016, + "mean_token_accuracy": 0.7367283046245575, + "num_tokens": 12661835.0, + "step": 5470 + }, + { + "epoch": 0.05024296323461997, + "learning_rate": 0.0001899532410378656, + "loss": 0.9191, + "mean_token_accuracy": 0.7345572352409363, + "num_tokens": 12685048.0, + "step": 5480 + }, + { + "epoch": 0.0503346474740992, + "learning_rate": 0.00018993490418996975, + "loss": 0.8806, + "mean_token_accuracy": 0.7392894685268402, + "num_tokens": 12708402.0, + "step": 5490 + }, + { + "epoch": 0.05042633171357844, + "learning_rate": 0.0001899165673420739, + "loss": 0.9381, + "mean_token_accuracy": 0.7295340657234192, + "num_tokens": 12731798.0, + "step": 5500 + }, + { + "epoch": 0.05051801595305767, + "learning_rate": 0.00018989823049417806, + "loss": 0.9145, + "mean_token_accuracy": 0.7341712176799774, + "num_tokens": 12755263.0, + "step": 5510 + }, + { + "epoch": 0.050609700192536904, + "learning_rate": 0.0001898798936462822, + "loss": 0.9494, + "mean_token_accuracy": 0.7211965560913086, + "num_tokens": 12777560.0, + "step": 5520 + }, + { + "epoch": 0.05070138443201613, + "learning_rate": 0.00018986155679838639, + "loss": 0.9024, + "mean_token_accuracy": 0.7308406412601471, + "num_tokens": 12800675.0, + "step": 5530 + }, + { + "epoch": 0.05079306867149537, + "learning_rate": 0.00018984321995049052, + "loss": 0.9153, + "mean_token_accuracy": 0.7297637462615967, + "num_tokens": 12823598.0, + "step": 5540 + }, + { + "epoch": 0.05088475291097461, + "learning_rate": 0.00018982488310259466, + "loss": 0.9173, + "mean_token_accuracy": 0.7339243113994598, + "num_tokens": 12847125.0, + "step": 5550 + }, + { + "epoch": 0.050976437150453836, + "learning_rate": 0.00018980654625469883, + "loss": 0.8923, + "mean_token_accuracy": 0.7382059693336487, + "num_tokens": 12869988.0, + "step": 5560 + }, + { + "epoch": 0.05106812138993307, + "learning_rate": 0.00018978820940680297, + "loss": 0.8706, + "mean_token_accuracy": 0.7482873499393463, + "num_tokens": 12892199.0, + "step": 5570 + }, + { + "epoch": 0.0511598056294123, + "learning_rate": 0.00018976987255890713, + "loss": 0.9112, + "mean_token_accuracy": 0.7290290057659149, + "num_tokens": 12915562.0, + "step": 5580 + }, + { + "epoch": 0.05125148986889154, + "learning_rate": 0.0001897515357110113, + "loss": 0.8861, + "mean_token_accuracy": 0.7361009776592254, + "num_tokens": 12937961.0, + "step": 5590 + }, + { + "epoch": 0.05134317410837077, + "learning_rate": 0.00018973319886311544, + "loss": 0.8663, + "mean_token_accuracy": 0.7427524626255035, + "num_tokens": 12961230.0, + "step": 5600 + }, + { + "epoch": 0.051434858347850006, + "learning_rate": 0.0001897148620152196, + "loss": 0.8949, + "mean_token_accuracy": 0.7323137044906616, + "num_tokens": 12983738.0, + "step": 5610 + }, + { + "epoch": 0.051526542587329235, + "learning_rate": 0.00018969652516732374, + "loss": 0.9205, + "mean_token_accuracy": 0.7301993727684021, + "num_tokens": 13006233.0, + "step": 5620 + }, + { + "epoch": 0.05161822682680847, + "learning_rate": 0.0001896781883194279, + "loss": 0.9052, + "mean_token_accuracy": 0.7336772859096528, + "num_tokens": 13029753.0, + "step": 5630 + }, + { + "epoch": 0.0517099110662877, + "learning_rate": 0.00018965985147153204, + "loss": 0.8929, + "mean_token_accuracy": 0.7403875470161438, + "num_tokens": 13053550.0, + "step": 5640 + }, + { + "epoch": 0.05180159530576694, + "learning_rate": 0.0001896415146236362, + "loss": 0.935, + "mean_token_accuracy": 0.725757896900177, + "num_tokens": 13075579.0, + "step": 5650 + }, + { + "epoch": 0.051893279545246175, + "learning_rate": 0.00018962317777574037, + "loss": 0.9334, + "mean_token_accuracy": 0.7271854400634765, + "num_tokens": 13099007.0, + "step": 5660 + }, + { + "epoch": 0.051984963784725405, + "learning_rate": 0.0001896048409278445, + "loss": 0.9228, + "mean_token_accuracy": 0.7263003051280975, + "num_tokens": 13122262.0, + "step": 5670 + }, + { + "epoch": 0.05207664802420464, + "learning_rate": 0.00018958650407994868, + "loss": 0.9106, + "mean_token_accuracy": 0.7385031998157501, + "num_tokens": 13144882.0, + "step": 5680 + }, + { + "epoch": 0.05216833226368387, + "learning_rate": 0.00018956816723205282, + "loss": 0.9616, + "mean_token_accuracy": 0.723107373714447, + "num_tokens": 13168316.0, + "step": 5690 + }, + { + "epoch": 0.05226001650316311, + "learning_rate": 0.00018954983038415695, + "loss": 0.9367, + "mean_token_accuracy": 0.7253693878650666, + "num_tokens": 13191038.0, + "step": 5700 + }, + { + "epoch": 0.05235170074264234, + "learning_rate": 0.00018953149353626112, + "loss": 0.9034, + "mean_token_accuracy": 0.7317043125629425, + "num_tokens": 13213894.0, + "step": 5710 + }, + { + "epoch": 0.052443384982121574, + "learning_rate": 0.00018951315668836529, + "loss": 0.9056, + "mean_token_accuracy": 0.7340876698493958, + "num_tokens": 13237425.0, + "step": 5720 + }, + { + "epoch": 0.052535069221600804, + "learning_rate": 0.00018949481984046945, + "loss": 0.9071, + "mean_token_accuracy": 0.7308786451816559, + "num_tokens": 13261397.0, + "step": 5730 + }, + { + "epoch": 0.05262675346108004, + "learning_rate": 0.0001894764829925736, + "loss": 0.9176, + "mean_token_accuracy": 0.7290667653083801, + "num_tokens": 13283673.0, + "step": 5740 + }, + { + "epoch": 0.05271843770055928, + "learning_rate": 0.00018945814614467773, + "loss": 0.9148, + "mean_token_accuracy": 0.7335974693298339, + "num_tokens": 13306127.0, + "step": 5750 + }, + { + "epoch": 0.05281012194003851, + "learning_rate": 0.0001894398092967819, + "loss": 0.8858, + "mean_token_accuracy": 0.7394903182983399, + "num_tokens": 13328718.0, + "step": 5760 + }, + { + "epoch": 0.052901806179517744, + "learning_rate": 0.00018942147244888603, + "loss": 0.8896, + "mean_token_accuracy": 0.7327750205993653, + "num_tokens": 13351679.0, + "step": 5770 + }, + { + "epoch": 0.05299349041899697, + "learning_rate": 0.0001894031356009902, + "loss": 0.9118, + "mean_token_accuracy": 0.731440144777298, + "num_tokens": 13374935.0, + "step": 5780 + }, + { + "epoch": 0.05308517465847621, + "learning_rate": 0.00018938479875309436, + "loss": 0.8995, + "mean_token_accuracy": 0.7352271199226379, + "num_tokens": 13398259.0, + "step": 5790 + }, + { + "epoch": 0.05317685889795544, + "learning_rate": 0.0001893664619051985, + "loss": 0.8953, + "mean_token_accuracy": 0.737835818529129, + "num_tokens": 13421088.0, + "step": 5800 + }, + { + "epoch": 0.053268543137434676, + "learning_rate": 0.00018934812505730267, + "loss": 0.8999, + "mean_token_accuracy": 0.7353157579898835, + "num_tokens": 13443602.0, + "step": 5810 + }, + { + "epoch": 0.053360227376913906, + "learning_rate": 0.0001893297882094068, + "loss": 0.9085, + "mean_token_accuracy": 0.7335394084453583, + "num_tokens": 13466446.0, + "step": 5820 + }, + { + "epoch": 0.05345191161639314, + "learning_rate": 0.00018931145136151097, + "loss": 0.9248, + "mean_token_accuracy": 0.7322831153869629, + "num_tokens": 13489637.0, + "step": 5830 + }, + { + "epoch": 0.05354359585587237, + "learning_rate": 0.0001892931145136151, + "loss": 0.9242, + "mean_token_accuracy": 0.7337723314762116, + "num_tokens": 13512273.0, + "step": 5840 + }, + { + "epoch": 0.05363528009535161, + "learning_rate": 0.00018927477766571927, + "loss": 0.8608, + "mean_token_accuracy": 0.7417926669120789, + "num_tokens": 13536002.0, + "step": 5850 + }, + { + "epoch": 0.053726964334830846, + "learning_rate": 0.00018925644081782344, + "loss": 0.8768, + "mean_token_accuracy": 0.7452898561954499, + "num_tokens": 13559219.0, + "step": 5860 + }, + { + "epoch": 0.053818648574310075, + "learning_rate": 0.00018923810396992758, + "loss": 0.9125, + "mean_token_accuracy": 0.732683789730072, + "num_tokens": 13582383.0, + "step": 5870 + }, + { + "epoch": 0.05391033281378931, + "learning_rate": 0.00018921976712203174, + "loss": 0.8871, + "mean_token_accuracy": 0.7352430641651153, + "num_tokens": 13605476.0, + "step": 5880 + }, + { + "epoch": 0.05400201705326854, + "learning_rate": 0.00018920143027413588, + "loss": 0.8876, + "mean_token_accuracy": 0.7374521434307099, + "num_tokens": 13628328.0, + "step": 5890 + }, + { + "epoch": 0.05409370129274778, + "learning_rate": 0.00018918309342624002, + "loss": 0.8935, + "mean_token_accuracy": 0.7319090247154236, + "num_tokens": 13651322.0, + "step": 5900 + }, + { + "epoch": 0.05418538553222701, + "learning_rate": 0.00018916475657834418, + "loss": 0.9031, + "mean_token_accuracy": 0.7305229842662812, + "num_tokens": 13674324.0, + "step": 5910 + }, + { + "epoch": 0.054277069771706245, + "learning_rate": 0.00018914641973044835, + "loss": 0.9023, + "mean_token_accuracy": 0.733366072177887, + "num_tokens": 13696523.0, + "step": 5920 + }, + { + "epoch": 0.054368754011185474, + "learning_rate": 0.00018912808288255252, + "loss": 0.9223, + "mean_token_accuracy": 0.7279128074645996, + "num_tokens": 13719611.0, + "step": 5930 + }, + { + "epoch": 0.05446043825066471, + "learning_rate": 0.00018910974603465665, + "loss": 0.8615, + "mean_token_accuracy": 0.7450281620025635, + "num_tokens": 13743060.0, + "step": 5940 + }, + { + "epoch": 0.05455212249014394, + "learning_rate": 0.0001890914091867608, + "loss": 0.9195, + "mean_token_accuracy": 0.7355048298835755, + "num_tokens": 13766559.0, + "step": 5950 + }, + { + "epoch": 0.05464380672962318, + "learning_rate": 0.00018907307233886496, + "loss": 0.8898, + "mean_token_accuracy": 0.7425531446933746, + "num_tokens": 13789749.0, + "step": 5960 + }, + { + "epoch": 0.054735490969102414, + "learning_rate": 0.0001890547354909691, + "loss": 0.8948, + "mean_token_accuracy": 0.7356940090656281, + "num_tokens": 13813212.0, + "step": 5970 + }, + { + "epoch": 0.054827175208581644, + "learning_rate": 0.0001890363986430733, + "loss": 0.8955, + "mean_token_accuracy": 0.7427564442157746, + "num_tokens": 13836278.0, + "step": 5980 + }, + { + "epoch": 0.05491885944806088, + "learning_rate": 0.00018901806179517743, + "loss": 0.8781, + "mean_token_accuracy": 0.7427315890789032, + "num_tokens": 13858837.0, + "step": 5990 + }, + { + "epoch": 0.05501054368754011, + "learning_rate": 0.00018899972494728156, + "loss": 0.9124, + "mean_token_accuracy": 0.7382710576057434, + "num_tokens": 13882252.0, + "step": 6000 + }, + { + "epoch": 0.05510222792701935, + "learning_rate": 0.00018898138809938573, + "loss": 0.912, + "mean_token_accuracy": 0.7302774846553802, + "num_tokens": 13905670.0, + "step": 6010 + }, + { + "epoch": 0.05519391216649858, + "learning_rate": 0.00018896305125148987, + "loss": 0.8934, + "mean_token_accuracy": 0.7333192527294159, + "num_tokens": 13928573.0, + "step": 6020 + }, + { + "epoch": 0.05528559640597781, + "learning_rate": 0.00018894471440359403, + "loss": 0.9205, + "mean_token_accuracy": 0.7285143196582794, + "num_tokens": 13951207.0, + "step": 6030 + }, + { + "epoch": 0.05537728064545704, + "learning_rate": 0.00018892637755569817, + "loss": 0.8835, + "mean_token_accuracy": 0.7364872217178344, + "num_tokens": 13974493.0, + "step": 6040 + }, + { + "epoch": 0.05546896488493628, + "learning_rate": 0.00018890804070780234, + "loss": 0.8833, + "mean_token_accuracy": 0.7420256316661835, + "num_tokens": 13996879.0, + "step": 6050 + }, + { + "epoch": 0.055560649124415516, + "learning_rate": 0.0001888897038599065, + "loss": 0.9403, + "mean_token_accuracy": 0.7265816628932953, + "num_tokens": 14019520.0, + "step": 6060 + }, + { + "epoch": 0.055652333363894746, + "learning_rate": 0.00018887136701201064, + "loss": 0.9022, + "mean_token_accuracy": 0.7378275334835053, + "num_tokens": 14042872.0, + "step": 6070 + }, + { + "epoch": 0.05574401760337398, + "learning_rate": 0.0001888530301641148, + "loss": 0.896, + "mean_token_accuracy": 0.7368328273296356, + "num_tokens": 14066443.0, + "step": 6080 + }, + { + "epoch": 0.05583570184285321, + "learning_rate": 0.00018883469331621894, + "loss": 0.8456, + "mean_token_accuracy": 0.7459207534790039, + "num_tokens": 14089901.0, + "step": 6090 + }, + { + "epoch": 0.05592738608233245, + "learning_rate": 0.00018881635646832308, + "loss": 0.9238, + "mean_token_accuracy": 0.7314928591251373, + "num_tokens": 14112575.0, + "step": 6100 + }, + { + "epoch": 0.05601907032181168, + "learning_rate": 0.00018879801962042725, + "loss": 0.906, + "mean_token_accuracy": 0.7364032506942749, + "num_tokens": 14135704.0, + "step": 6110 + }, + { + "epoch": 0.056110754561290915, + "learning_rate": 0.00018877968277253141, + "loss": 0.8724, + "mean_token_accuracy": 0.7461249709129334, + "num_tokens": 14158714.0, + "step": 6120 + }, + { + "epoch": 0.056202438800770145, + "learning_rate": 0.00018876134592463558, + "loss": 0.9115, + "mean_token_accuracy": 0.7310883283615113, + "num_tokens": 14181618.0, + "step": 6130 + }, + { + "epoch": 0.05629412304024938, + "learning_rate": 0.00018874300907673972, + "loss": 0.9306, + "mean_token_accuracy": 0.7311136484146118, + "num_tokens": 14204124.0, + "step": 6140 + }, + { + "epoch": 0.05638580727972861, + "learning_rate": 0.00018872467222884386, + "loss": 0.8831, + "mean_token_accuracy": 0.7353039979934692, + "num_tokens": 14226147.0, + "step": 6150 + }, + { + "epoch": 0.05647749151920785, + "learning_rate": 0.00018870633538094802, + "loss": 0.9053, + "mean_token_accuracy": 0.7393592476844788, + "num_tokens": 14249515.0, + "step": 6160 + }, + { + "epoch": 0.056569175758687085, + "learning_rate": 0.00018868799853305216, + "loss": 0.8776, + "mean_token_accuracy": 0.7368683636188507, + "num_tokens": 14272137.0, + "step": 6170 + }, + { + "epoch": 0.056660859998166314, + "learning_rate": 0.00018866966168515635, + "loss": 0.9018, + "mean_token_accuracy": 0.733753764629364, + "num_tokens": 14295267.0, + "step": 6180 + }, + { + "epoch": 0.05675254423764555, + "learning_rate": 0.0001886513248372605, + "loss": 0.9312, + "mean_token_accuracy": 0.731525057554245, + "num_tokens": 14318197.0, + "step": 6190 + }, + { + "epoch": 0.05684422847712478, + "learning_rate": 0.00018863298798936463, + "loss": 0.9351, + "mean_token_accuracy": 0.7326232314109802, + "num_tokens": 14341827.0, + "step": 6200 + }, + { + "epoch": 0.05693591271660402, + "learning_rate": 0.0001886146511414688, + "loss": 0.9383, + "mean_token_accuracy": 0.7253555476665496, + "num_tokens": 14364640.0, + "step": 6210 + }, + { + "epoch": 0.05702759695608325, + "learning_rate": 0.00018859631429357293, + "loss": 0.9435, + "mean_token_accuracy": 0.7301494657993317, + "num_tokens": 14388414.0, + "step": 6220 + }, + { + "epoch": 0.057119281195562484, + "learning_rate": 0.0001885779774456771, + "loss": 0.907, + "mean_token_accuracy": 0.7335768043994904, + "num_tokens": 14411936.0, + "step": 6230 + }, + { + "epoch": 0.057210965435041714, + "learning_rate": 0.00018855964059778124, + "loss": 0.9083, + "mean_token_accuracy": 0.7336957097053528, + "num_tokens": 14434648.0, + "step": 6240 + }, + { + "epoch": 0.05730264967452095, + "learning_rate": 0.0001885413037498854, + "loss": 0.85, + "mean_token_accuracy": 0.744956886768341, + "num_tokens": 14456764.0, + "step": 6250 + }, + { + "epoch": 0.05739433391400019, + "learning_rate": 0.00018852296690198957, + "loss": 0.8716, + "mean_token_accuracy": 0.7397426307201386, + "num_tokens": 14479853.0, + "step": 6260 + }, + { + "epoch": 0.057486018153479417, + "learning_rate": 0.0001885046300540937, + "loss": 0.8937, + "mean_token_accuracy": 0.7402728736400604, + "num_tokens": 14503349.0, + "step": 6270 + }, + { + "epoch": 0.05757770239295865, + "learning_rate": 0.00018848629320619787, + "loss": 0.9142, + "mean_token_accuracy": 0.7332817733287811, + "num_tokens": 14526076.0, + "step": 6280 + }, + { + "epoch": 0.05766938663243788, + "learning_rate": 0.000188467956358302, + "loss": 0.9258, + "mean_token_accuracy": 0.7274915874004364, + "num_tokens": 14549465.0, + "step": 6290 + }, + { + "epoch": 0.05776107087191712, + "learning_rate": 0.00018844961951040615, + "loss": 0.9064, + "mean_token_accuracy": 0.7345609068870544, + "num_tokens": 14573191.0, + "step": 6300 + }, + { + "epoch": 0.05785275511139635, + "learning_rate": 0.00018843128266251034, + "loss": 0.9096, + "mean_token_accuracy": 0.734123432636261, + "num_tokens": 14596590.0, + "step": 6310 + }, + { + "epoch": 0.057944439350875586, + "learning_rate": 0.00018841294581461448, + "loss": 0.8964, + "mean_token_accuracy": 0.7332545578479767, + "num_tokens": 14619528.0, + "step": 6320 + }, + { + "epoch": 0.058036123590354816, + "learning_rate": 0.00018839460896671864, + "loss": 0.8747, + "mean_token_accuracy": 0.7394288897514343, + "num_tokens": 14643136.0, + "step": 6330 + }, + { + "epoch": 0.05812780782983405, + "learning_rate": 0.00018837627211882278, + "loss": 0.9034, + "mean_token_accuracy": 0.739733350276947, + "num_tokens": 14665759.0, + "step": 6340 + }, + { + "epoch": 0.05821949206931328, + "learning_rate": 0.00018835793527092692, + "loss": 0.8784, + "mean_token_accuracy": 0.7444514751434326, + "num_tokens": 14688597.0, + "step": 6350 + }, + { + "epoch": 0.05831117630879252, + "learning_rate": 0.00018833959842303109, + "loss": 0.9192, + "mean_token_accuracy": 0.7293457150459289, + "num_tokens": 14712072.0, + "step": 6360 + }, + { + "epoch": 0.058402860548271755, + "learning_rate": 0.00018832126157513522, + "loss": 0.9162, + "mean_token_accuracy": 0.7286231815814972, + "num_tokens": 14735369.0, + "step": 6370 + }, + { + "epoch": 0.058494544787750985, + "learning_rate": 0.00018830292472723942, + "loss": 0.8805, + "mean_token_accuracy": 0.7397731244564056, + "num_tokens": 14757974.0, + "step": 6380 + }, + { + "epoch": 0.05858622902723022, + "learning_rate": 0.00018828458787934356, + "loss": 0.9018, + "mean_token_accuracy": 0.7344457864761352, + "num_tokens": 14780663.0, + "step": 6390 + }, + { + "epoch": 0.05867791326670945, + "learning_rate": 0.0001882662510314477, + "loss": 0.9278, + "mean_token_accuracy": 0.73030526638031, + "num_tokens": 14803159.0, + "step": 6400 + }, + { + "epoch": 0.05876959750618869, + "learning_rate": 0.00018824791418355186, + "loss": 0.8956, + "mean_token_accuracy": 0.7391948223114013, + "num_tokens": 14826264.0, + "step": 6410 + }, + { + "epoch": 0.05886128174566792, + "learning_rate": 0.000188229577335656, + "loss": 0.9161, + "mean_token_accuracy": 0.7264982461929321, + "num_tokens": 14849010.0, + "step": 6420 + }, + { + "epoch": 0.058952965985147154, + "learning_rate": 0.00018821124048776016, + "loss": 0.893, + "mean_token_accuracy": 0.7374953508377076, + "num_tokens": 14872077.0, + "step": 6430 + }, + { + "epoch": 0.059044650224626384, + "learning_rate": 0.00018819290363986433, + "loss": 0.9364, + "mean_token_accuracy": 0.7247084021568299, + "num_tokens": 14895186.0, + "step": 6440 + }, + { + "epoch": 0.05913633446410562, + "learning_rate": 0.00018817456679196847, + "loss": 0.8867, + "mean_token_accuracy": 0.7435551762580872, + "num_tokens": 14917517.0, + "step": 6450 + }, + { + "epoch": 0.05922801870358485, + "learning_rate": 0.00018815622994407263, + "loss": 0.872, + "mean_token_accuracy": 0.7501089930534363, + "num_tokens": 14940031.0, + "step": 6460 + }, + { + "epoch": 0.05931970294306409, + "learning_rate": 0.00018813789309617677, + "loss": 0.8952, + "mean_token_accuracy": 0.7309714913368225, + "num_tokens": 14963179.0, + "step": 6470 + }, + { + "epoch": 0.059411387182543324, + "learning_rate": 0.00018811955624828094, + "loss": 0.873, + "mean_token_accuracy": 0.7429340958595276, + "num_tokens": 14985751.0, + "step": 6480 + }, + { + "epoch": 0.05950307142202255, + "learning_rate": 0.00018810121940038507, + "loss": 0.8904, + "mean_token_accuracy": 0.7367467224597931, + "num_tokens": 15008446.0, + "step": 6490 + }, + { + "epoch": 0.05959475566150179, + "learning_rate": 0.0001880828825524892, + "loss": 0.8634, + "mean_token_accuracy": 0.7398522615432739, + "num_tokens": 15031349.0, + "step": 6500 + }, + { + "epoch": 0.05968643990098102, + "learning_rate": 0.0001880645457045934, + "loss": 0.8951, + "mean_token_accuracy": 0.7324127376079559, + "num_tokens": 15054551.0, + "step": 6510 + }, + { + "epoch": 0.059778124140460256, + "learning_rate": 0.00018804620885669754, + "loss": 0.8648, + "mean_token_accuracy": 0.7435194730758667, + "num_tokens": 15078018.0, + "step": 6520 + }, + { + "epoch": 0.059869808379939486, + "learning_rate": 0.0001880278720088017, + "loss": 0.8842, + "mean_token_accuracy": 0.743254816532135, + "num_tokens": 15101025.0, + "step": 6530 + }, + { + "epoch": 0.05996149261941872, + "learning_rate": 0.00018800953516090585, + "loss": 0.8871, + "mean_token_accuracy": 0.7371959745883941, + "num_tokens": 15124153.0, + "step": 6540 + }, + { + "epoch": 0.06005317685889795, + "learning_rate": 0.00018799119831300999, + "loss": 0.8699, + "mean_token_accuracy": 0.7455730557441711, + "num_tokens": 15147110.0, + "step": 6550 + }, + { + "epoch": 0.06014486109837719, + "learning_rate": 0.00018797286146511415, + "loss": 0.9192, + "mean_token_accuracy": 0.7300807714462281, + "num_tokens": 15170377.0, + "step": 6560 + }, + { + "epoch": 0.060236545337856426, + "learning_rate": 0.00018795452461721832, + "loss": 0.9205, + "mean_token_accuracy": 0.7324627101421356, + "num_tokens": 15194174.0, + "step": 6570 + }, + { + "epoch": 0.060328229577335656, + "learning_rate": 0.00018793618776932248, + "loss": 0.875, + "mean_token_accuracy": 0.7377755105495453, + "num_tokens": 15217608.0, + "step": 6580 + }, + { + "epoch": 0.06041991381681489, + "learning_rate": 0.00018791785092142662, + "loss": 0.8978, + "mean_token_accuracy": 0.7367534399032593, + "num_tokens": 15240404.0, + "step": 6590 + }, + { + "epoch": 0.06051159805629412, + "learning_rate": 0.00018789951407353076, + "loss": 0.9103, + "mean_token_accuracy": 0.7309245347976685, + "num_tokens": 15262817.0, + "step": 6600 + }, + { + "epoch": 0.06060328229577336, + "learning_rate": 0.00018788117722563492, + "loss": 0.8727, + "mean_token_accuracy": 0.7372923493385315, + "num_tokens": 15286113.0, + "step": 6610 + }, + { + "epoch": 0.06069496653525259, + "learning_rate": 0.00018786284037773906, + "loss": 0.8703, + "mean_token_accuracy": 0.7400227010250091, + "num_tokens": 15309220.0, + "step": 6620 + }, + { + "epoch": 0.060786650774731825, + "learning_rate": 0.00018784450352984323, + "loss": 0.9371, + "mean_token_accuracy": 0.7229818522930145, + "num_tokens": 15332332.0, + "step": 6630 + }, + { + "epoch": 0.060878335014211055, + "learning_rate": 0.0001878261666819474, + "loss": 0.8735, + "mean_token_accuracy": 0.7370070874691009, + "num_tokens": 15355692.0, + "step": 6640 + }, + { + "epoch": 0.06097001925369029, + "learning_rate": 0.00018780782983405153, + "loss": 0.9187, + "mean_token_accuracy": 0.7303988337516785, + "num_tokens": 15378602.0, + "step": 6650 + }, + { + "epoch": 0.06106170349316952, + "learning_rate": 0.0001877894929861557, + "loss": 0.8962, + "mean_token_accuracy": 0.7402011632919312, + "num_tokens": 15403457.0, + "step": 6660 + }, + { + "epoch": 0.06115338773264876, + "learning_rate": 0.00018777115613825983, + "loss": 0.8651, + "mean_token_accuracy": 0.7377009212970733, + "num_tokens": 15426229.0, + "step": 6670 + }, + { + "epoch": 0.061245071972127994, + "learning_rate": 0.000187752819290364, + "loss": 0.9219, + "mean_token_accuracy": 0.7281396806240081, + "num_tokens": 15449562.0, + "step": 6680 + }, + { + "epoch": 0.061336756211607224, + "learning_rate": 0.00018773448244246814, + "loss": 0.8789, + "mean_token_accuracy": 0.7357682764530182, + "num_tokens": 15473220.0, + "step": 6690 + }, + { + "epoch": 0.06142844045108646, + "learning_rate": 0.0001877161455945723, + "loss": 0.8652, + "mean_token_accuracy": 0.7406415164470672, + "num_tokens": 15496530.0, + "step": 6700 + }, + { + "epoch": 0.06152012469056569, + "learning_rate": 0.00018769780874667647, + "loss": 0.8978, + "mean_token_accuracy": 0.7423011541366578, + "num_tokens": 15519869.0, + "step": 6710 + }, + { + "epoch": 0.06161180893004493, + "learning_rate": 0.0001876794718987806, + "loss": 0.8602, + "mean_token_accuracy": 0.7424899756908416, + "num_tokens": 15542720.0, + "step": 6720 + }, + { + "epoch": 0.06170349316952416, + "learning_rate": 0.00018766113505088477, + "loss": 0.8759, + "mean_token_accuracy": 0.7321468591690063, + "num_tokens": 15565691.0, + "step": 6730 + }, + { + "epoch": 0.06179517740900339, + "learning_rate": 0.0001876427982029889, + "loss": 0.9021, + "mean_token_accuracy": 0.7332452654838562, + "num_tokens": 15587986.0, + "step": 6740 + }, + { + "epoch": 0.06188686164848262, + "learning_rate": 0.00018762446135509305, + "loss": 0.9058, + "mean_token_accuracy": 0.7323048353195191, + "num_tokens": 15611069.0, + "step": 6750 + }, + { + "epoch": 0.06197854588796186, + "learning_rate": 0.00018760612450719721, + "loss": 0.9216, + "mean_token_accuracy": 0.7371990263462067, + "num_tokens": 15634139.0, + "step": 6760 + }, + { + "epoch": 0.06207023012744109, + "learning_rate": 0.00018758778765930138, + "loss": 0.8878, + "mean_token_accuracy": 0.7320496499538421, + "num_tokens": 15657348.0, + "step": 6770 + }, + { + "epoch": 0.062161914366920326, + "learning_rate": 0.00018756945081140555, + "loss": 0.9143, + "mean_token_accuracy": 0.7285496592521667, + "num_tokens": 15680247.0, + "step": 6780 + }, + { + "epoch": 0.06225359860639956, + "learning_rate": 0.00018755111396350968, + "loss": 0.8648, + "mean_token_accuracy": 0.7439673006534576, + "num_tokens": 15703156.0, + "step": 6790 + }, + { + "epoch": 0.06234528284587879, + "learning_rate": 0.00018753277711561382, + "loss": 0.8835, + "mean_token_accuracy": 0.7361136078834534, + "num_tokens": 15725451.0, + "step": 6800 + }, + { + "epoch": 0.06243696708535803, + "learning_rate": 0.000187514440267718, + "loss": 0.8724, + "mean_token_accuracy": 0.7394465565681457, + "num_tokens": 15748133.0, + "step": 6810 + }, + { + "epoch": 0.06252865132483726, + "learning_rate": 0.00018749610341982213, + "loss": 0.884, + "mean_token_accuracy": 0.7421841084957123, + "num_tokens": 15771816.0, + "step": 6820 + }, + { + "epoch": 0.0626203355643165, + "learning_rate": 0.00018747776657192632, + "loss": 0.9246, + "mean_token_accuracy": 0.7252350389957428, + "num_tokens": 15795042.0, + "step": 6830 + }, + { + "epoch": 0.06271201980379573, + "learning_rate": 0.00018745942972403046, + "loss": 0.9047, + "mean_token_accuracy": 0.7368955314159393, + "num_tokens": 15818614.0, + "step": 6840 + }, + { + "epoch": 0.06280370404327495, + "learning_rate": 0.0001874410928761346, + "loss": 0.8984, + "mean_token_accuracy": 0.7376978814601898, + "num_tokens": 15841511.0, + "step": 6850 + }, + { + "epoch": 0.06289538828275419, + "learning_rate": 0.00018742275602823876, + "loss": 0.9005, + "mean_token_accuracy": 0.7304648399353028, + "num_tokens": 15864316.0, + "step": 6860 + }, + { + "epoch": 0.06298707252223343, + "learning_rate": 0.0001874044191803429, + "loss": 0.8921, + "mean_token_accuracy": 0.7313158929347991, + "num_tokens": 15887153.0, + "step": 6870 + }, + { + "epoch": 0.06307875676171266, + "learning_rate": 0.00018738608233244706, + "loss": 0.893, + "mean_token_accuracy": 0.7359376966953277, + "num_tokens": 15910352.0, + "step": 6880 + }, + { + "epoch": 0.0631704410011919, + "learning_rate": 0.0001873677454845512, + "loss": 0.8977, + "mean_token_accuracy": 0.7376785218715668, + "num_tokens": 15933915.0, + "step": 6890 + }, + { + "epoch": 0.06326212524067112, + "learning_rate": 0.00018734940863665537, + "loss": 0.9317, + "mean_token_accuracy": 0.7326904177665711, + "num_tokens": 15957172.0, + "step": 6900 + }, + { + "epoch": 0.06335380948015036, + "learning_rate": 0.00018733107178875953, + "loss": 0.8774, + "mean_token_accuracy": 0.7328968286514282, + "num_tokens": 15980904.0, + "step": 6910 + }, + { + "epoch": 0.0634454937196296, + "learning_rate": 0.00018731273494086367, + "loss": 0.898, + "mean_token_accuracy": 0.7409002304077148, + "num_tokens": 16004324.0, + "step": 6920 + }, + { + "epoch": 0.06353717795910883, + "learning_rate": 0.00018729439809296784, + "loss": 0.8682, + "mean_token_accuracy": 0.7439389050006866, + "num_tokens": 16026946.0, + "step": 6930 + }, + { + "epoch": 0.06362886219858806, + "learning_rate": 0.00018727606124507198, + "loss": 0.9173, + "mean_token_accuracy": 0.7388446688652038, + "num_tokens": 16050303.0, + "step": 6940 + }, + { + "epoch": 0.0637205464380673, + "learning_rate": 0.00018725772439717611, + "loss": 0.9191, + "mean_token_accuracy": 0.7310415506362915, + "num_tokens": 16072316.0, + "step": 6950 + }, + { + "epoch": 0.06381223067754653, + "learning_rate": 0.0001872393875492803, + "loss": 0.8931, + "mean_token_accuracy": 0.7374844074249267, + "num_tokens": 16095978.0, + "step": 6960 + }, + { + "epoch": 0.06390391491702577, + "learning_rate": 0.00018722105070138444, + "loss": 0.8632, + "mean_token_accuracy": 0.7394248306751251, + "num_tokens": 16119124.0, + "step": 6970 + }, + { + "epoch": 0.063995599156505, + "learning_rate": 0.0001872027138534886, + "loss": 0.9068, + "mean_token_accuracy": 0.732264769077301, + "num_tokens": 16142278.0, + "step": 6980 + }, + { + "epoch": 0.06408728339598423, + "learning_rate": 0.00018718437700559275, + "loss": 0.8759, + "mean_token_accuracy": 0.7376603662967682, + "num_tokens": 16165905.0, + "step": 6990 + }, + { + "epoch": 0.06417896763546346, + "learning_rate": 0.0001871660401576969, + "loss": 0.9255, + "mean_token_accuracy": 0.7317251801490784, + "num_tokens": 16189684.0, + "step": 7000 + }, + { + "epoch": 0.0642706518749427, + "learning_rate": 0.00018714770330980105, + "loss": 0.9138, + "mean_token_accuracy": 0.7325927197933197, + "num_tokens": 16212901.0, + "step": 7010 + }, + { + "epoch": 0.06436233611442194, + "learning_rate": 0.0001871293664619052, + "loss": 0.9256, + "mean_token_accuracy": 0.7301843285560607, + "num_tokens": 16236792.0, + "step": 7020 + }, + { + "epoch": 0.06445402035390116, + "learning_rate": 0.00018711102961400938, + "loss": 0.874, + "mean_token_accuracy": 0.7444778919219971, + "num_tokens": 16260056.0, + "step": 7030 + }, + { + "epoch": 0.0645457045933804, + "learning_rate": 0.00018709269276611352, + "loss": 0.9333, + "mean_token_accuracy": 0.7293393611907959, + "num_tokens": 16282761.0, + "step": 7040 + }, + { + "epoch": 0.06463738883285963, + "learning_rate": 0.00018707435591821766, + "loss": 0.8976, + "mean_token_accuracy": 0.7393335163593292, + "num_tokens": 16305315.0, + "step": 7050 + }, + { + "epoch": 0.06472907307233887, + "learning_rate": 0.00018705601907032183, + "loss": 0.9162, + "mean_token_accuracy": 0.7291788518428802, + "num_tokens": 16328631.0, + "step": 7060 + }, + { + "epoch": 0.06482075731181809, + "learning_rate": 0.00018703768222242596, + "loss": 0.8899, + "mean_token_accuracy": 0.7410358488559723, + "num_tokens": 16351733.0, + "step": 7070 + }, + { + "epoch": 0.06491244155129733, + "learning_rate": 0.00018701934537453013, + "loss": 0.8874, + "mean_token_accuracy": 0.7387078881263733, + "num_tokens": 16374963.0, + "step": 7080 + }, + { + "epoch": 0.06500412579077657, + "learning_rate": 0.0001870010085266343, + "loss": 0.9475, + "mean_token_accuracy": 0.7295987010002136, + "num_tokens": 16397461.0, + "step": 7090 + }, + { + "epoch": 0.0650958100302558, + "learning_rate": 0.00018698267167873843, + "loss": 0.8814, + "mean_token_accuracy": 0.7374467432498932, + "num_tokens": 16420852.0, + "step": 7100 + }, + { + "epoch": 0.06518749426973504, + "learning_rate": 0.0001869643348308426, + "loss": 0.8845, + "mean_token_accuracy": 0.739473843574524, + "num_tokens": 16444586.0, + "step": 7110 + }, + { + "epoch": 0.06527917850921426, + "learning_rate": 0.00018694599798294674, + "loss": 0.8925, + "mean_token_accuracy": 0.731457096338272, + "num_tokens": 16467033.0, + "step": 7120 + }, + { + "epoch": 0.0653708627486935, + "learning_rate": 0.0001869276611350509, + "loss": 0.9007, + "mean_token_accuracy": 0.7407608687877655, + "num_tokens": 16489861.0, + "step": 7130 + }, + { + "epoch": 0.06546254698817273, + "learning_rate": 0.00018690932428715504, + "loss": 0.8853, + "mean_token_accuracy": 0.7345590412616729, + "num_tokens": 16513864.0, + "step": 7140 + }, + { + "epoch": 0.06555423122765197, + "learning_rate": 0.00018689098743925918, + "loss": 0.8828, + "mean_token_accuracy": 0.7381375849246978, + "num_tokens": 16537198.0, + "step": 7150 + }, + { + "epoch": 0.0656459154671312, + "learning_rate": 0.00018687265059136337, + "loss": 0.884, + "mean_token_accuracy": 0.7393272697925568, + "num_tokens": 16560335.0, + "step": 7160 + }, + { + "epoch": 0.06573759970661043, + "learning_rate": 0.0001868543137434675, + "loss": 0.8972, + "mean_token_accuracy": 0.736215102672577, + "num_tokens": 16583397.0, + "step": 7170 + }, + { + "epoch": 0.06582928394608967, + "learning_rate": 0.00018683597689557167, + "loss": 0.9127, + "mean_token_accuracy": 0.7304023504257202, + "num_tokens": 16605837.0, + "step": 7180 + }, + { + "epoch": 0.0659209681855689, + "learning_rate": 0.0001868176400476758, + "loss": 0.8992, + "mean_token_accuracy": 0.735389119386673, + "num_tokens": 16629642.0, + "step": 7190 + }, + { + "epoch": 0.06601265242504814, + "learning_rate": 0.00018679930319977995, + "loss": 0.917, + "mean_token_accuracy": 0.7340928137302398, + "num_tokens": 16652890.0, + "step": 7200 + }, + { + "epoch": 0.06610433666452736, + "learning_rate": 0.00018678096635188412, + "loss": 0.9363, + "mean_token_accuracy": 0.7297744393348694, + "num_tokens": 16676579.0, + "step": 7210 + }, + { + "epoch": 0.0661960209040066, + "learning_rate": 0.00018676262950398826, + "loss": 0.8672, + "mean_token_accuracy": 0.7379568219184875, + "num_tokens": 16700076.0, + "step": 7220 + }, + { + "epoch": 0.06628770514348584, + "learning_rate": 0.00018674429265609245, + "loss": 0.9195, + "mean_token_accuracy": 0.7359227120876313, + "num_tokens": 16724267.0, + "step": 7230 + }, + { + "epoch": 0.06637938938296507, + "learning_rate": 0.00018672595580819659, + "loss": 0.9032, + "mean_token_accuracy": 0.7368239104747772, + "num_tokens": 16747543.0, + "step": 7240 + }, + { + "epoch": 0.0664710736224443, + "learning_rate": 0.00018670761896030072, + "loss": 0.9144, + "mean_token_accuracy": 0.7297830283641815, + "num_tokens": 16771820.0, + "step": 7250 + }, + { + "epoch": 0.06656275786192353, + "learning_rate": 0.0001866892821124049, + "loss": 0.8988, + "mean_token_accuracy": 0.7404946625232697, + "num_tokens": 16795665.0, + "step": 7260 + }, + { + "epoch": 0.06665444210140277, + "learning_rate": 0.00018667094526450903, + "loss": 0.8852, + "mean_token_accuracy": 0.7353927493095398, + "num_tokens": 16819389.0, + "step": 7270 + }, + { + "epoch": 0.066746126340882, + "learning_rate": 0.0001866526084166132, + "loss": 0.8787, + "mean_token_accuracy": 0.7369317412376404, + "num_tokens": 16842826.0, + "step": 7280 + }, + { + "epoch": 0.06683781058036124, + "learning_rate": 0.00018663427156871736, + "loss": 0.8929, + "mean_token_accuracy": 0.7297127783298493, + "num_tokens": 16866166.0, + "step": 7290 + }, + { + "epoch": 0.06692949481984047, + "learning_rate": 0.0001866159347208215, + "loss": 0.874, + "mean_token_accuracy": 0.7410301506519318, + "num_tokens": 16888677.0, + "step": 7300 + }, + { + "epoch": 0.0670211790593197, + "learning_rate": 0.00018659759787292566, + "loss": 0.889, + "mean_token_accuracy": 0.7322735846042633, + "num_tokens": 16912050.0, + "step": 7310 + }, + { + "epoch": 0.06711286329879894, + "learning_rate": 0.0001865792610250298, + "loss": 0.8856, + "mean_token_accuracy": 0.7414264559745789, + "num_tokens": 16935508.0, + "step": 7320 + }, + { + "epoch": 0.06720454753827818, + "learning_rate": 0.00018656092417713397, + "loss": 0.9075, + "mean_token_accuracy": 0.7362886309623718, + "num_tokens": 16958563.0, + "step": 7330 + }, + { + "epoch": 0.0672962317777574, + "learning_rate": 0.0001865425873292381, + "loss": 0.915, + "mean_token_accuracy": 0.7296898543834687, + "num_tokens": 16982051.0, + "step": 7340 + }, + { + "epoch": 0.06738791601723663, + "learning_rate": 0.00018652425048134224, + "loss": 0.8964, + "mean_token_accuracy": 0.7311189293861389, + "num_tokens": 17004712.0, + "step": 7350 + }, + { + "epoch": 0.06747960025671587, + "learning_rate": 0.00018650591363344644, + "loss": 0.9058, + "mean_token_accuracy": 0.7329726874828338, + "num_tokens": 17028050.0, + "step": 7360 + }, + { + "epoch": 0.06757128449619511, + "learning_rate": 0.00018648757678555057, + "loss": 0.9303, + "mean_token_accuracy": 0.7248231410980225, + "num_tokens": 17051053.0, + "step": 7370 + }, + { + "epoch": 0.06766296873567433, + "learning_rate": 0.00018646923993765474, + "loss": 0.8843, + "mean_token_accuracy": 0.7385094702243805, + "num_tokens": 17073754.0, + "step": 7380 + }, + { + "epoch": 0.06775465297515357, + "learning_rate": 0.00018645090308975888, + "loss": 0.9123, + "mean_token_accuracy": 0.7319236874580384, + "num_tokens": 17097349.0, + "step": 7390 + }, + { + "epoch": 0.0678463372146328, + "learning_rate": 0.00018643256624186302, + "loss": 0.8846, + "mean_token_accuracy": 0.7347530663013458, + "num_tokens": 17120271.0, + "step": 7400 + }, + { + "epoch": 0.06793802145411204, + "learning_rate": 0.00018641422939396718, + "loss": 0.9098, + "mean_token_accuracy": 0.7334261775016785, + "num_tokens": 17143657.0, + "step": 7410 + }, + { + "epoch": 0.06802970569359128, + "learning_rate": 0.00018639589254607135, + "loss": 0.9247, + "mean_token_accuracy": 0.7289936065673828, + "num_tokens": 17166438.0, + "step": 7420 + }, + { + "epoch": 0.0681213899330705, + "learning_rate": 0.0001863775556981755, + "loss": 0.9361, + "mean_token_accuracy": 0.7277748346328735, + "num_tokens": 17189881.0, + "step": 7430 + }, + { + "epoch": 0.06821307417254974, + "learning_rate": 0.00018635921885027965, + "loss": 0.8601, + "mean_token_accuracy": 0.7468758761882782, + "num_tokens": 17213078.0, + "step": 7440 + }, + { + "epoch": 0.06830475841202897, + "learning_rate": 0.0001863408820023838, + "loss": 0.9185, + "mean_token_accuracy": 0.7321870148181915, + "num_tokens": 17236890.0, + "step": 7450 + }, + { + "epoch": 0.06839644265150821, + "learning_rate": 0.00018632254515448795, + "loss": 0.882, + "mean_token_accuracy": 0.7418410241603851, + "num_tokens": 17259974.0, + "step": 7460 + }, + { + "epoch": 0.06848812689098743, + "learning_rate": 0.0001863042083065921, + "loss": 0.8628, + "mean_token_accuracy": 0.7472536444664002, + "num_tokens": 17283370.0, + "step": 7470 + }, + { + "epoch": 0.06857981113046667, + "learning_rate": 0.00018628587145869626, + "loss": 0.8835, + "mean_token_accuracy": 0.7388462424278259, + "num_tokens": 17306312.0, + "step": 7480 + }, + { + "epoch": 0.0686714953699459, + "learning_rate": 0.00018626753461080042, + "loss": 0.9212, + "mean_token_accuracy": 0.7299582719802856, + "num_tokens": 17328831.0, + "step": 7490 + }, + { + "epoch": 0.06876317960942514, + "learning_rate": 0.00018624919776290456, + "loss": 0.8588, + "mean_token_accuracy": 0.7480060636997223, + "num_tokens": 17352124.0, + "step": 7500 + }, + { + "epoch": 0.06885486384890438, + "learning_rate": 0.00018623086091500873, + "loss": 0.919, + "mean_token_accuracy": 0.735031658411026, + "num_tokens": 17376609.0, + "step": 7510 + }, + { + "epoch": 0.0689465480883836, + "learning_rate": 0.00018621252406711287, + "loss": 0.8857, + "mean_token_accuracy": 0.7383214592933655, + "num_tokens": 17399810.0, + "step": 7520 + }, + { + "epoch": 0.06903823232786284, + "learning_rate": 0.00018619418721921703, + "loss": 0.8489, + "mean_token_accuracy": 0.744429212808609, + "num_tokens": 17422162.0, + "step": 7530 + }, + { + "epoch": 0.06912991656734208, + "learning_rate": 0.00018617585037132117, + "loss": 0.8776, + "mean_token_accuracy": 0.7415482640266419, + "num_tokens": 17445079.0, + "step": 7540 + }, + { + "epoch": 0.06922160080682131, + "learning_rate": 0.00018615751352342533, + "loss": 0.8773, + "mean_token_accuracy": 0.7432332038879395, + "num_tokens": 17467641.0, + "step": 7550 + }, + { + "epoch": 0.06931328504630054, + "learning_rate": 0.0001861391766755295, + "loss": 0.8946, + "mean_token_accuracy": 0.7381612658500671, + "num_tokens": 17491272.0, + "step": 7560 + }, + { + "epoch": 0.06940496928577977, + "learning_rate": 0.00018612083982763364, + "loss": 0.8861, + "mean_token_accuracy": 0.742399537563324, + "num_tokens": 17514326.0, + "step": 7570 + }, + { + "epoch": 0.06949665352525901, + "learning_rate": 0.0001861025029797378, + "loss": 0.8719, + "mean_token_accuracy": 0.7429358124732971, + "num_tokens": 17538380.0, + "step": 7580 + }, + { + "epoch": 0.06958833776473825, + "learning_rate": 0.00018608416613184194, + "loss": 0.8753, + "mean_token_accuracy": 0.7393517673015595, + "num_tokens": 17562048.0, + "step": 7590 + }, + { + "epoch": 0.06968002200421748, + "learning_rate": 0.00018606582928394608, + "loss": 0.9625, + "mean_token_accuracy": 0.7224134266376495, + "num_tokens": 17584969.0, + "step": 7600 + }, + { + "epoch": 0.0697717062436967, + "learning_rate": 0.00018604749243605025, + "loss": 0.9035, + "mean_token_accuracy": 0.7296406388282776, + "num_tokens": 17608461.0, + "step": 7610 + }, + { + "epoch": 0.06986339048317594, + "learning_rate": 0.0001860291555881544, + "loss": 0.8754, + "mean_token_accuracy": 0.7468557894229889, + "num_tokens": 17631323.0, + "step": 7620 + }, + { + "epoch": 0.06995507472265518, + "learning_rate": 0.00018601081874025858, + "loss": 0.9026, + "mean_token_accuracy": 0.7325952231884003, + "num_tokens": 17655593.0, + "step": 7630 + }, + { + "epoch": 0.07004675896213441, + "learning_rate": 0.00018599248189236271, + "loss": 0.8996, + "mean_token_accuracy": 0.7371292054653168, + "num_tokens": 17678836.0, + "step": 7640 + }, + { + "epoch": 0.07013844320161364, + "learning_rate": 0.00018597414504446685, + "loss": 0.8808, + "mean_token_accuracy": 0.7433316528797149, + "num_tokens": 17702229.0, + "step": 7650 + }, + { + "epoch": 0.07023012744109287, + "learning_rate": 0.00018595580819657102, + "loss": 0.8986, + "mean_token_accuracy": 0.7327707171440124, + "num_tokens": 17725528.0, + "step": 7660 + }, + { + "epoch": 0.07032181168057211, + "learning_rate": 0.00018593747134867516, + "loss": 0.885, + "mean_token_accuracy": 0.7369406819343567, + "num_tokens": 17747838.0, + "step": 7670 + }, + { + "epoch": 0.07041349592005135, + "learning_rate": 0.00018591913450077932, + "loss": 0.9538, + "mean_token_accuracy": 0.7233248591423035, + "num_tokens": 17771786.0, + "step": 7680 + }, + { + "epoch": 0.07050518015953057, + "learning_rate": 0.0001859007976528835, + "loss": 0.9146, + "mean_token_accuracy": 0.7280868113040924, + "num_tokens": 17794416.0, + "step": 7690 + }, + { + "epoch": 0.0705968643990098, + "learning_rate": 0.00018588246080498763, + "loss": 0.9179, + "mean_token_accuracy": 0.7320180058479309, + "num_tokens": 17818764.0, + "step": 7700 + }, + { + "epoch": 0.07068854863848904, + "learning_rate": 0.0001858641239570918, + "loss": 0.8764, + "mean_token_accuracy": 0.7389637172222138, + "num_tokens": 17841747.0, + "step": 7710 + }, + { + "epoch": 0.07078023287796828, + "learning_rate": 0.00018584578710919593, + "loss": 0.9236, + "mean_token_accuracy": 0.7238744258880615, + "num_tokens": 17864897.0, + "step": 7720 + }, + { + "epoch": 0.07087191711744752, + "learning_rate": 0.0001858274502613001, + "loss": 0.9008, + "mean_token_accuracy": 0.7376737713813781, + "num_tokens": 17888390.0, + "step": 7730 + }, + { + "epoch": 0.07096360135692674, + "learning_rate": 0.00018580911341340423, + "loss": 0.9364, + "mean_token_accuracy": 0.7339943230152131, + "num_tokens": 17911341.0, + "step": 7740 + }, + { + "epoch": 0.07105528559640598, + "learning_rate": 0.0001857907765655084, + "loss": 0.8868, + "mean_token_accuracy": 0.7426157474517823, + "num_tokens": 17933928.0, + "step": 7750 + }, + { + "epoch": 0.07114696983588521, + "learning_rate": 0.00018577243971761256, + "loss": 0.9084, + "mean_token_accuracy": 0.7337997078895568, + "num_tokens": 17956464.0, + "step": 7760 + }, + { + "epoch": 0.07123865407536445, + "learning_rate": 0.0001857541028697167, + "loss": 0.8883, + "mean_token_accuracy": 0.7383899211883544, + "num_tokens": 17980429.0, + "step": 7770 + }, + { + "epoch": 0.07133033831484367, + "learning_rate": 0.00018573576602182087, + "loss": 0.8442, + "mean_token_accuracy": 0.7452596187591553, + "num_tokens": 18003751.0, + "step": 7780 + }, + { + "epoch": 0.07142202255432291, + "learning_rate": 0.000185717429173925, + "loss": 0.9186, + "mean_token_accuracy": 0.7293454945087433, + "num_tokens": 18027433.0, + "step": 7790 + }, + { + "epoch": 0.07151370679380215, + "learning_rate": 0.00018569909232602914, + "loss": 0.8958, + "mean_token_accuracy": 0.7356851279735566, + "num_tokens": 18050922.0, + "step": 7800 + }, + { + "epoch": 0.07160539103328138, + "learning_rate": 0.00018568075547813334, + "loss": 0.8912, + "mean_token_accuracy": 0.7396374762058258, + "num_tokens": 18074551.0, + "step": 7810 + }, + { + "epoch": 0.07169707527276062, + "learning_rate": 0.00018566241863023748, + "loss": 0.886, + "mean_token_accuracy": 0.7380398035049438, + "num_tokens": 18097734.0, + "step": 7820 + }, + { + "epoch": 0.07178875951223984, + "learning_rate": 0.00018564408178234164, + "loss": 0.9089, + "mean_token_accuracy": 0.7365286886692047, + "num_tokens": 18120093.0, + "step": 7830 + }, + { + "epoch": 0.07188044375171908, + "learning_rate": 0.00018562574493444578, + "loss": 0.9603, + "mean_token_accuracy": 0.718100905418396, + "num_tokens": 18144102.0, + "step": 7840 + }, + { + "epoch": 0.07197212799119831, + "learning_rate": 0.00018560740808654992, + "loss": 0.888, + "mean_token_accuracy": 0.7385085821151733, + "num_tokens": 18167554.0, + "step": 7850 + }, + { + "epoch": 0.07206381223067755, + "learning_rate": 0.00018558907123865408, + "loss": 0.8856, + "mean_token_accuracy": 0.7322841823101044, + "num_tokens": 18190684.0, + "step": 7860 + }, + { + "epoch": 0.07215549647015677, + "learning_rate": 0.00018557073439075822, + "loss": 0.9147, + "mean_token_accuracy": 0.7345363199710846, + "num_tokens": 18212828.0, + "step": 7870 + }, + { + "epoch": 0.07224718070963601, + "learning_rate": 0.0001855523975428624, + "loss": 0.9369, + "mean_token_accuracy": 0.7276594460010528, + "num_tokens": 18236208.0, + "step": 7880 + }, + { + "epoch": 0.07233886494911525, + "learning_rate": 0.00018553406069496655, + "loss": 0.886, + "mean_token_accuracy": 0.7395935773849487, + "num_tokens": 18259184.0, + "step": 7890 + }, + { + "epoch": 0.07243054918859448, + "learning_rate": 0.0001855157238470707, + "loss": 0.9038, + "mean_token_accuracy": 0.7328357338905335, + "num_tokens": 18282023.0, + "step": 7900 + }, + { + "epoch": 0.07252223342807372, + "learning_rate": 0.00018549738699917486, + "loss": 0.916, + "mean_token_accuracy": 0.7275796115398407, + "num_tokens": 18304842.0, + "step": 7910 + }, + { + "epoch": 0.07261391766755294, + "learning_rate": 0.000185479050151279, + "loss": 0.9065, + "mean_token_accuracy": 0.7362442374229431, + "num_tokens": 18328316.0, + "step": 7920 + }, + { + "epoch": 0.07270560190703218, + "learning_rate": 0.00018546071330338316, + "loss": 0.8724, + "mean_token_accuracy": 0.7417624533176422, + "num_tokens": 18350784.0, + "step": 7930 + }, + { + "epoch": 0.07279728614651142, + "learning_rate": 0.00018544237645548733, + "loss": 0.9288, + "mean_token_accuracy": 0.7282447874546051, + "num_tokens": 18373584.0, + "step": 7940 + }, + { + "epoch": 0.07288897038599065, + "learning_rate": 0.00018542403960759146, + "loss": 0.9354, + "mean_token_accuracy": 0.7260125935077667, + "num_tokens": 18396471.0, + "step": 7950 + }, + { + "epoch": 0.07298065462546988, + "learning_rate": 0.00018540570275969563, + "loss": 0.8686, + "mean_token_accuracy": 0.7401220858097076, + "num_tokens": 18419692.0, + "step": 7960 + }, + { + "epoch": 0.07307233886494911, + "learning_rate": 0.00018538736591179977, + "loss": 0.9266, + "mean_token_accuracy": 0.7221021354198456, + "num_tokens": 18443411.0, + "step": 7970 + }, + { + "epoch": 0.07316402310442835, + "learning_rate": 0.00018536902906390393, + "loss": 0.8414, + "mean_token_accuracy": 0.746176129579544, + "num_tokens": 18466740.0, + "step": 7980 + }, + { + "epoch": 0.07325570734390759, + "learning_rate": 0.00018535069221600807, + "loss": 0.9206, + "mean_token_accuracy": 0.7348521947860718, + "num_tokens": 18489677.0, + "step": 7990 + }, + { + "epoch": 0.07334739158338681, + "learning_rate": 0.0001853323553681122, + "loss": 0.8849, + "mean_token_accuracy": 0.7342815041542053, + "num_tokens": 18512294.0, + "step": 8000 + }, + { + "epoch": 0.07343907582286605, + "learning_rate": 0.0001853140185202164, + "loss": 0.8835, + "mean_token_accuracy": 0.7435256361961364, + "num_tokens": 18535164.0, + "step": 8010 + }, + { + "epoch": 0.07353076006234528, + "learning_rate": 0.00018529568167232054, + "loss": 0.872, + "mean_token_accuracy": 0.7408172130584717, + "num_tokens": 18558999.0, + "step": 8020 + }, + { + "epoch": 0.07362244430182452, + "learning_rate": 0.0001852773448244247, + "loss": 0.868, + "mean_token_accuracy": 0.7401656746864319, + "num_tokens": 18582912.0, + "step": 8030 + }, + { + "epoch": 0.07371412854130376, + "learning_rate": 0.00018525900797652884, + "loss": 0.8189, + "mean_token_accuracy": 0.7549288332462311, + "num_tokens": 18605803.0, + "step": 8040 + }, + { + "epoch": 0.07380581278078298, + "learning_rate": 0.00018524067112863298, + "loss": 0.9304, + "mean_token_accuracy": 0.7264647424221039, + "num_tokens": 18628917.0, + "step": 8050 + }, + { + "epoch": 0.07389749702026222, + "learning_rate": 0.00018522233428073715, + "loss": 0.8898, + "mean_token_accuracy": 0.7439450800418854, + "num_tokens": 18652810.0, + "step": 8060 + }, + { + "epoch": 0.07398918125974145, + "learning_rate": 0.0001852039974328413, + "loss": 0.8805, + "mean_token_accuracy": 0.7408682942390442, + "num_tokens": 18675968.0, + "step": 8070 + }, + { + "epoch": 0.07408086549922069, + "learning_rate": 0.00018518566058494545, + "loss": 0.8952, + "mean_token_accuracy": 0.733596795797348, + "num_tokens": 18698822.0, + "step": 8080 + }, + { + "epoch": 0.07417254973869991, + "learning_rate": 0.00018516732373704962, + "loss": 0.9037, + "mean_token_accuracy": 0.7288919508457183, + "num_tokens": 18721128.0, + "step": 8090 + }, + { + "epoch": 0.07426423397817915, + "learning_rate": 0.00018514898688915375, + "loss": 0.8833, + "mean_token_accuracy": 0.7353435218334198, + "num_tokens": 18744285.0, + "step": 8100 + }, + { + "epoch": 0.07435591821765838, + "learning_rate": 0.00018513065004125792, + "loss": 0.8756, + "mean_token_accuracy": 0.739633196592331, + "num_tokens": 18767682.0, + "step": 8110 + }, + { + "epoch": 0.07444760245713762, + "learning_rate": 0.00018511231319336206, + "loss": 0.8861, + "mean_token_accuracy": 0.7327218413352966, + "num_tokens": 18791529.0, + "step": 8120 + }, + { + "epoch": 0.07453928669661686, + "learning_rate": 0.00018509397634546622, + "loss": 0.8942, + "mean_token_accuracy": 0.7419546723365784, + "num_tokens": 18814752.0, + "step": 8130 + }, + { + "epoch": 0.07463097093609608, + "learning_rate": 0.0001850756394975704, + "loss": 0.8967, + "mean_token_accuracy": 0.7323192059993744, + "num_tokens": 18837598.0, + "step": 8140 + }, + { + "epoch": 0.07472265517557532, + "learning_rate": 0.00018505730264967453, + "loss": 0.8914, + "mean_token_accuracy": 0.7411729276180268, + "num_tokens": 18860319.0, + "step": 8150 + }, + { + "epoch": 0.07481433941505455, + "learning_rate": 0.0001850389658017787, + "loss": 0.8686, + "mean_token_accuracy": 0.7420401394367218, + "num_tokens": 18883411.0, + "step": 8160 + }, + { + "epoch": 0.07490602365453379, + "learning_rate": 0.00018502062895388283, + "loss": 0.9161, + "mean_token_accuracy": 0.7286843657493591, + "num_tokens": 18905727.0, + "step": 8170 + }, + { + "epoch": 0.07499770789401301, + "learning_rate": 0.000185002292105987, + "loss": 0.8704, + "mean_token_accuracy": 0.7459618389606476, + "num_tokens": 18929436.0, + "step": 8180 + }, + { + "epoch": 0.07508939213349225, + "learning_rate": 0.00018498395525809114, + "loss": 0.9291, + "mean_token_accuracy": 0.7256647884845734, + "num_tokens": 18952552.0, + "step": 8190 + }, + { + "epoch": 0.07518107637297149, + "learning_rate": 0.0001849656184101953, + "loss": 0.9214, + "mean_token_accuracy": 0.7314865827560425, + "num_tokens": 18975090.0, + "step": 8200 + }, + { + "epoch": 0.07527276061245072, + "learning_rate": 0.00018494728156229947, + "loss": 0.8783, + "mean_token_accuracy": 0.7414880692958832, + "num_tokens": 18998071.0, + "step": 8210 + }, + { + "epoch": 0.07536444485192996, + "learning_rate": 0.0001849289447144036, + "loss": 0.8938, + "mean_token_accuracy": 0.741072142124176, + "num_tokens": 19020958.0, + "step": 8220 + }, + { + "epoch": 0.07545612909140918, + "learning_rate": 0.00018491060786650777, + "loss": 0.9333, + "mean_token_accuracy": 0.7330272257328033, + "num_tokens": 19044328.0, + "step": 8230 + }, + { + "epoch": 0.07554781333088842, + "learning_rate": 0.0001848922710186119, + "loss": 0.8952, + "mean_token_accuracy": 0.7314849197864532, + "num_tokens": 19066770.0, + "step": 8240 + }, + { + "epoch": 0.07563949757036766, + "learning_rate": 0.00018487393417071605, + "loss": 0.9039, + "mean_token_accuracy": 0.7377885401248931, + "num_tokens": 19090650.0, + "step": 8250 + }, + { + "epoch": 0.07573118180984689, + "learning_rate": 0.0001848555973228202, + "loss": 0.8775, + "mean_token_accuracy": 0.7388021290302277, + "num_tokens": 19113998.0, + "step": 8260 + }, + { + "epoch": 0.07582286604932612, + "learning_rate": 0.00018483726047492438, + "loss": 0.8719, + "mean_token_accuracy": 0.7420752584934235, + "num_tokens": 19137048.0, + "step": 8270 + }, + { + "epoch": 0.07591455028880535, + "learning_rate": 0.00018481892362702852, + "loss": 0.8743, + "mean_token_accuracy": 0.7413016796112061, + "num_tokens": 19160849.0, + "step": 8280 + }, + { + "epoch": 0.07600623452828459, + "learning_rate": 0.00018480058677913268, + "loss": 0.9035, + "mean_token_accuracy": 0.7368860065937042, + "num_tokens": 19183747.0, + "step": 8290 + }, + { + "epoch": 0.07609791876776383, + "learning_rate": 0.00018478224993123682, + "loss": 0.8826, + "mean_token_accuracy": 0.741813462972641, + "num_tokens": 19207895.0, + "step": 8300 + }, + { + "epoch": 0.07618960300724305, + "learning_rate": 0.00018476391308334098, + "loss": 0.8937, + "mean_token_accuracy": 0.7364883244037628, + "num_tokens": 19231139.0, + "step": 8310 + }, + { + "epoch": 0.07628128724672228, + "learning_rate": 0.00018474557623544512, + "loss": 0.9097, + "mean_token_accuracy": 0.7353035271167755, + "num_tokens": 19254845.0, + "step": 8320 + }, + { + "epoch": 0.07637297148620152, + "learning_rate": 0.0001847272393875493, + "loss": 0.9021, + "mean_token_accuracy": 0.7364081740379333, + "num_tokens": 19278248.0, + "step": 8330 + }, + { + "epoch": 0.07646465572568076, + "learning_rate": 0.00018470890253965345, + "loss": 0.9109, + "mean_token_accuracy": 0.7344849526882171, + "num_tokens": 19300732.0, + "step": 8340 + }, + { + "epoch": 0.07655633996516, + "learning_rate": 0.0001846905656917576, + "loss": 0.9152, + "mean_token_accuracy": 0.7305308163166047, + "num_tokens": 19324322.0, + "step": 8350 + }, + { + "epoch": 0.07664802420463922, + "learning_rate": 0.00018467222884386176, + "loss": 0.9046, + "mean_token_accuracy": 0.7361734569072723, + "num_tokens": 19348400.0, + "step": 8360 + }, + { + "epoch": 0.07673970844411845, + "learning_rate": 0.0001846538919959659, + "loss": 0.9312, + "mean_token_accuracy": 0.7255568861961365, + "num_tokens": 19371307.0, + "step": 8370 + }, + { + "epoch": 0.07683139268359769, + "learning_rate": 0.00018463555514807006, + "loss": 0.8451, + "mean_token_accuracy": 0.7498118042945862, + "num_tokens": 19393832.0, + "step": 8380 + }, + { + "epoch": 0.07692307692307693, + "learning_rate": 0.0001846172183001742, + "loss": 0.9102, + "mean_token_accuracy": 0.7367885828018188, + "num_tokens": 19416290.0, + "step": 8390 + }, + { + "epoch": 0.07701476116255615, + "learning_rate": 0.00018459888145227837, + "loss": 0.8905, + "mean_token_accuracy": 0.7381061017513275, + "num_tokens": 19438403.0, + "step": 8400 + }, + { + "epoch": 0.07710644540203539, + "learning_rate": 0.00018458054460438253, + "loss": 0.8724, + "mean_token_accuracy": 0.7411992430686951, + "num_tokens": 19461862.0, + "step": 8410 + }, + { + "epoch": 0.07719812964151462, + "learning_rate": 0.00018456220775648667, + "loss": 0.848, + "mean_token_accuracy": 0.7488736093044281, + "num_tokens": 19484569.0, + "step": 8420 + }, + { + "epoch": 0.07728981388099386, + "learning_rate": 0.00018454387090859083, + "loss": 0.8825, + "mean_token_accuracy": 0.7367926299571991, + "num_tokens": 19507935.0, + "step": 8430 + }, + { + "epoch": 0.0773814981204731, + "learning_rate": 0.00018452553406069497, + "loss": 0.8891, + "mean_token_accuracy": 0.728267252445221, + "num_tokens": 19531556.0, + "step": 8440 + }, + { + "epoch": 0.07747318235995232, + "learning_rate": 0.0001845071972127991, + "loss": 0.8769, + "mean_token_accuracy": 0.737507826089859, + "num_tokens": 19554621.0, + "step": 8450 + }, + { + "epoch": 0.07756486659943156, + "learning_rate": 0.00018448886036490328, + "loss": 0.8876, + "mean_token_accuracy": 0.7386962890625, + "num_tokens": 19578394.0, + "step": 8460 + }, + { + "epoch": 0.07765655083891079, + "learning_rate": 0.00018447052351700744, + "loss": 0.8753, + "mean_token_accuracy": 0.7423336207866669, + "num_tokens": 19601913.0, + "step": 8470 + }, + { + "epoch": 0.07774823507839003, + "learning_rate": 0.00018445218666911158, + "loss": 0.9025, + "mean_token_accuracy": 0.7393895745277405, + "num_tokens": 19626183.0, + "step": 8480 + }, + { + "epoch": 0.07783991931786925, + "learning_rate": 0.00018443384982121575, + "loss": 0.8913, + "mean_token_accuracy": 0.738505357503891, + "num_tokens": 19648997.0, + "step": 8490 + }, + { + "epoch": 0.07793160355734849, + "learning_rate": 0.00018441551297331988, + "loss": 0.8809, + "mean_token_accuracy": 0.7413359463214875, + "num_tokens": 19671810.0, + "step": 8500 + }, + { + "epoch": 0.07802328779682773, + "learning_rate": 0.00018439717612542405, + "loss": 0.8657, + "mean_token_accuracy": 0.7465264201164246, + "num_tokens": 19695597.0, + "step": 8510 + }, + { + "epoch": 0.07811497203630696, + "learning_rate": 0.0001843788392775282, + "loss": 0.8899, + "mean_token_accuracy": 0.7404637336730957, + "num_tokens": 19719712.0, + "step": 8520 + }, + { + "epoch": 0.0782066562757862, + "learning_rate": 0.00018436050242963235, + "loss": 0.9133, + "mean_token_accuracy": 0.7294314622879028, + "num_tokens": 19742476.0, + "step": 8530 + }, + { + "epoch": 0.07829834051526542, + "learning_rate": 0.00018434216558173652, + "loss": 0.8523, + "mean_token_accuracy": 0.7467393636703491, + "num_tokens": 19766150.0, + "step": 8540 + }, + { + "epoch": 0.07839002475474466, + "learning_rate": 0.00018432382873384066, + "loss": 0.8754, + "mean_token_accuracy": 0.741338175535202, + "num_tokens": 19788595.0, + "step": 8550 + }, + { + "epoch": 0.0784817089942239, + "learning_rate": 0.00018430549188594482, + "loss": 0.9201, + "mean_token_accuracy": 0.7328977167606354, + "num_tokens": 19811650.0, + "step": 8560 + }, + { + "epoch": 0.07857339323370313, + "learning_rate": 0.00018428715503804896, + "loss": 0.9023, + "mean_token_accuracy": 0.7369591057300567, + "num_tokens": 19835189.0, + "step": 8570 + }, + { + "epoch": 0.07866507747318235, + "learning_rate": 0.00018426881819015313, + "loss": 0.8898, + "mean_token_accuracy": 0.7325446903705597, + "num_tokens": 19857559.0, + "step": 8580 + }, + { + "epoch": 0.07875676171266159, + "learning_rate": 0.00018425048134225726, + "loss": 0.8951, + "mean_token_accuracy": 0.7413085997104645, + "num_tokens": 19880426.0, + "step": 8590 + }, + { + "epoch": 0.07884844595214083, + "learning_rate": 0.00018423214449436143, + "loss": 0.8995, + "mean_token_accuracy": 0.735448557138443, + "num_tokens": 19903141.0, + "step": 8600 + }, + { + "epoch": 0.07894013019162006, + "learning_rate": 0.0001842138076464656, + "loss": 0.8479, + "mean_token_accuracy": 0.7454135417938232, + "num_tokens": 19926504.0, + "step": 8610 + }, + { + "epoch": 0.0790318144310993, + "learning_rate": 0.00018419547079856973, + "loss": 0.8897, + "mean_token_accuracy": 0.7353550672531128, + "num_tokens": 19950113.0, + "step": 8620 + }, + { + "epoch": 0.07912349867057852, + "learning_rate": 0.0001841771339506739, + "loss": 0.867, + "mean_token_accuracy": 0.7345813035964965, + "num_tokens": 19974333.0, + "step": 8630 + }, + { + "epoch": 0.07921518291005776, + "learning_rate": 0.00018415879710277804, + "loss": 0.8743, + "mean_token_accuracy": 0.7420864105224609, + "num_tokens": 19996898.0, + "step": 8640 + }, + { + "epoch": 0.079306867149537, + "learning_rate": 0.00018414046025488218, + "loss": 0.8682, + "mean_token_accuracy": 0.7440168380737304, + "num_tokens": 20019741.0, + "step": 8650 + }, + { + "epoch": 0.07939855138901623, + "learning_rate": 0.00018412212340698637, + "loss": 0.9167, + "mean_token_accuracy": 0.7251489818096161, + "num_tokens": 20042555.0, + "step": 8660 + }, + { + "epoch": 0.07949023562849546, + "learning_rate": 0.0001841037865590905, + "loss": 0.8747, + "mean_token_accuracy": 0.744568943977356, + "num_tokens": 20066376.0, + "step": 8670 + }, + { + "epoch": 0.0795819198679747, + "learning_rate": 0.00018408544971119464, + "loss": 0.9263, + "mean_token_accuracy": 0.7316726863384246, + "num_tokens": 20089115.0, + "step": 8680 + }, + { + "epoch": 0.07967360410745393, + "learning_rate": 0.0001840671128632988, + "loss": 0.8645, + "mean_token_accuracy": 0.735486525297165, + "num_tokens": 20112260.0, + "step": 8690 + }, + { + "epoch": 0.07976528834693317, + "learning_rate": 0.00018404877601540295, + "loss": 0.8894, + "mean_token_accuracy": 0.7351312339305878, + "num_tokens": 20135132.0, + "step": 8700 + }, + { + "epoch": 0.07985697258641239, + "learning_rate": 0.00018403043916750711, + "loss": 0.8826, + "mean_token_accuracy": 0.7413839042186737, + "num_tokens": 20157358.0, + "step": 8710 + }, + { + "epoch": 0.07994865682589163, + "learning_rate": 0.00018401210231961125, + "loss": 0.9046, + "mean_token_accuracy": 0.7350801885128021, + "num_tokens": 20181209.0, + "step": 8720 + }, + { + "epoch": 0.08004034106537086, + "learning_rate": 0.00018399376547171542, + "loss": 0.8739, + "mean_token_accuracy": 0.7423152804374695, + "num_tokens": 20204229.0, + "step": 8730 + }, + { + "epoch": 0.0801320253048501, + "learning_rate": 0.00018397542862381958, + "loss": 0.8953, + "mean_token_accuracy": 0.7356089353561401, + "num_tokens": 20227928.0, + "step": 8740 + }, + { + "epoch": 0.08022370954432934, + "learning_rate": 0.00018395709177592372, + "loss": 0.9026, + "mean_token_accuracy": 0.7324627876281739, + "num_tokens": 20250216.0, + "step": 8750 + }, + { + "epoch": 0.08031539378380856, + "learning_rate": 0.0001839387549280279, + "loss": 0.9058, + "mean_token_accuracy": 0.7393997013568878, + "num_tokens": 20272232.0, + "step": 8760 + }, + { + "epoch": 0.0804070780232878, + "learning_rate": 0.00018392041808013202, + "loss": 0.8813, + "mean_token_accuracy": 0.7367434084415436, + "num_tokens": 20295550.0, + "step": 8770 + }, + { + "epoch": 0.08049876226276703, + "learning_rate": 0.0001839020812322362, + "loss": 0.9454, + "mean_token_accuracy": 0.7237827122211457, + "num_tokens": 20318767.0, + "step": 8780 + }, + { + "epoch": 0.08059044650224627, + "learning_rate": 0.00018388374438434036, + "loss": 0.9218, + "mean_token_accuracy": 0.7363382518291474, + "num_tokens": 20341763.0, + "step": 8790 + }, + { + "epoch": 0.08068213074172549, + "learning_rate": 0.0001838654075364445, + "loss": 0.9096, + "mean_token_accuracy": 0.7324922680854797, + "num_tokens": 20364896.0, + "step": 8800 + }, + { + "epoch": 0.08077381498120473, + "learning_rate": 0.00018384707068854866, + "loss": 0.896, + "mean_token_accuracy": 0.7368214428424835, + "num_tokens": 20387231.0, + "step": 8810 + }, + { + "epoch": 0.08086549922068396, + "learning_rate": 0.0001838287338406528, + "loss": 0.8796, + "mean_token_accuracy": 0.7440318286418914, + "num_tokens": 20411114.0, + "step": 8820 + }, + { + "epoch": 0.0809571834601632, + "learning_rate": 0.00018381039699275696, + "loss": 0.9121, + "mean_token_accuracy": 0.7343628704547882, + "num_tokens": 20434243.0, + "step": 8830 + }, + { + "epoch": 0.08104886769964244, + "learning_rate": 0.0001837920601448611, + "loss": 0.9109, + "mean_token_accuracy": 0.7294663310050964, + "num_tokens": 20457325.0, + "step": 8840 + }, + { + "epoch": 0.08114055193912166, + "learning_rate": 0.00018377372329696524, + "loss": 0.885, + "mean_token_accuracy": 0.7388871312141418, + "num_tokens": 20480852.0, + "step": 8850 + }, + { + "epoch": 0.0812322361786009, + "learning_rate": 0.00018375538644906943, + "loss": 0.859, + "mean_token_accuracy": 0.7362000644207001, + "num_tokens": 20504421.0, + "step": 8860 + }, + { + "epoch": 0.08132392041808013, + "learning_rate": 0.00018373704960117357, + "loss": 0.8667, + "mean_token_accuracy": 0.7418944597244262, + "num_tokens": 20527108.0, + "step": 8870 + }, + { + "epoch": 0.08141560465755937, + "learning_rate": 0.0001837187127532777, + "loss": 0.8593, + "mean_token_accuracy": 0.7480157673358917, + "num_tokens": 20550605.0, + "step": 8880 + }, + { + "epoch": 0.0815072888970386, + "learning_rate": 0.00018370037590538187, + "loss": 0.9114, + "mean_token_accuracy": 0.7304875373840332, + "num_tokens": 20573090.0, + "step": 8890 + }, + { + "epoch": 0.08159897313651783, + "learning_rate": 0.000183682039057486, + "loss": 0.8376, + "mean_token_accuracy": 0.745467746257782, + "num_tokens": 20596228.0, + "step": 8900 + }, + { + "epoch": 0.08169065737599707, + "learning_rate": 0.00018366370220959018, + "loss": 0.8848, + "mean_token_accuracy": 0.7430700659751892, + "num_tokens": 20618943.0, + "step": 8910 + }, + { + "epoch": 0.0817823416154763, + "learning_rate": 0.00018364536536169434, + "loss": 0.9316, + "mean_token_accuracy": 0.7364117920398712, + "num_tokens": 20641169.0, + "step": 8920 + }, + { + "epoch": 0.08187402585495554, + "learning_rate": 0.00018362702851379848, + "loss": 0.8253, + "mean_token_accuracy": 0.7549974143505096, + "num_tokens": 20664607.0, + "step": 8930 + }, + { + "epoch": 0.08196571009443476, + "learning_rate": 0.00018360869166590265, + "loss": 0.8802, + "mean_token_accuracy": 0.7424738585948945, + "num_tokens": 20687667.0, + "step": 8940 + }, + { + "epoch": 0.082057394333914, + "learning_rate": 0.00018359035481800679, + "loss": 0.8875, + "mean_token_accuracy": 0.738900226354599, + "num_tokens": 20710902.0, + "step": 8950 + }, + { + "epoch": 0.08214907857339324, + "learning_rate": 0.00018357201797011095, + "loss": 0.8374, + "mean_token_accuracy": 0.7451739192008973, + "num_tokens": 20734252.0, + "step": 8960 + }, + { + "epoch": 0.08224076281287247, + "learning_rate": 0.0001835536811222151, + "loss": 0.8889, + "mean_token_accuracy": 0.7412276923656463, + "num_tokens": 20756954.0, + "step": 8970 + }, + { + "epoch": 0.0823324470523517, + "learning_rate": 0.00018353534427431925, + "loss": 0.8668, + "mean_token_accuracy": 0.7402545034885406, + "num_tokens": 20779877.0, + "step": 8980 + }, + { + "epoch": 0.08242413129183093, + "learning_rate": 0.00018351700742642342, + "loss": 0.8855, + "mean_token_accuracy": 0.7334759831428528, + "num_tokens": 20802755.0, + "step": 8990 + }, + { + "epoch": 0.08251581553131017, + "learning_rate": 0.00018349867057852756, + "loss": 0.8862, + "mean_token_accuracy": 0.7427118003368378, + "num_tokens": 20826197.0, + "step": 9000 + }, + { + "epoch": 0.0826074997707894, + "learning_rate": 0.00018348033373063172, + "loss": 0.9096, + "mean_token_accuracy": 0.7359176874160767, + "num_tokens": 20848927.0, + "step": 9010 + }, + { + "epoch": 0.08269918401026863, + "learning_rate": 0.00018346199688273586, + "loss": 0.8515, + "mean_token_accuracy": 0.7440576672554016, + "num_tokens": 20871663.0, + "step": 9020 + }, + { + "epoch": 0.08279086824974786, + "learning_rate": 0.00018344366003484003, + "loss": 0.9031, + "mean_token_accuracy": 0.7336151599884033, + "num_tokens": 20894820.0, + "step": 9030 + }, + { + "epoch": 0.0828825524892271, + "learning_rate": 0.00018342532318694417, + "loss": 0.8684, + "mean_token_accuracy": 0.7430043578147888, + "num_tokens": 20917421.0, + "step": 9040 + }, + { + "epoch": 0.08297423672870634, + "learning_rate": 0.00018340698633904833, + "loss": 0.875, + "mean_token_accuracy": 0.7408009827136993, + "num_tokens": 20940502.0, + "step": 9050 + }, + { + "epoch": 0.08306592096818557, + "learning_rate": 0.0001833886494911525, + "loss": 0.8969, + "mean_token_accuracy": 0.7269556581974029, + "num_tokens": 20963538.0, + "step": 9060 + }, + { + "epoch": 0.0831576052076648, + "learning_rate": 0.00018337031264325664, + "loss": 0.9083, + "mean_token_accuracy": 0.7323137760162354, + "num_tokens": 20986338.0, + "step": 9070 + }, + { + "epoch": 0.08324928944714403, + "learning_rate": 0.00018335197579536077, + "loss": 0.8996, + "mean_token_accuracy": 0.7331121683120727, + "num_tokens": 21010087.0, + "step": 9080 + }, + { + "epoch": 0.08334097368662327, + "learning_rate": 0.00018333363894746494, + "loss": 0.864, + "mean_token_accuracy": 0.7416777074337005, + "num_tokens": 21033354.0, + "step": 9090 + }, + { + "epoch": 0.08343265792610251, + "learning_rate": 0.00018331530209956908, + "loss": 0.8994, + "mean_token_accuracy": 0.730178689956665, + "num_tokens": 21056357.0, + "step": 9100 + }, + { + "epoch": 0.08352434216558173, + "learning_rate": 0.00018329696525167324, + "loss": 0.8907, + "mean_token_accuracy": 0.7331460475921631, + "num_tokens": 21079081.0, + "step": 9110 + }, + { + "epoch": 0.08361602640506097, + "learning_rate": 0.0001832786284037774, + "loss": 0.873, + "mean_token_accuracy": 0.7385563969612121, + "num_tokens": 21102943.0, + "step": 9120 + }, + { + "epoch": 0.0837077106445402, + "learning_rate": 0.00018326029155588155, + "loss": 0.8868, + "mean_token_accuracy": 0.7314861476421356, + "num_tokens": 21126669.0, + "step": 9130 + }, + { + "epoch": 0.08379939488401944, + "learning_rate": 0.0001832419547079857, + "loss": 0.8772, + "mean_token_accuracy": 0.7403957903385162, + "num_tokens": 21149283.0, + "step": 9140 + }, + { + "epoch": 0.08389107912349868, + "learning_rate": 0.00018322361786008985, + "loss": 0.916, + "mean_token_accuracy": 0.7340789377689362, + "num_tokens": 21171927.0, + "step": 9150 + }, + { + "epoch": 0.0839827633629779, + "learning_rate": 0.00018320528101219402, + "loss": 0.8674, + "mean_token_accuracy": 0.7459503710269928, + "num_tokens": 21194580.0, + "step": 9160 + }, + { + "epoch": 0.08407444760245714, + "learning_rate": 0.00018318694416429815, + "loss": 0.8805, + "mean_token_accuracy": 0.7379239141941071, + "num_tokens": 21217462.0, + "step": 9170 + }, + { + "epoch": 0.08416613184193637, + "learning_rate": 0.00018316860731640232, + "loss": 0.9298, + "mean_token_accuracy": 0.7346334517002105, + "num_tokens": 21240716.0, + "step": 9180 + }, + { + "epoch": 0.08425781608141561, + "learning_rate": 0.00018315027046850648, + "loss": 0.8791, + "mean_token_accuracy": 0.735994029045105, + "num_tokens": 21264109.0, + "step": 9190 + }, + { + "epoch": 0.08434950032089483, + "learning_rate": 0.00018313193362061062, + "loss": 0.9068, + "mean_token_accuracy": 0.734699672460556, + "num_tokens": 21287737.0, + "step": 9200 + }, + { + "epoch": 0.08444118456037407, + "learning_rate": 0.0001831135967727148, + "loss": 0.8664, + "mean_token_accuracy": 0.7357621252536773, + "num_tokens": 21311051.0, + "step": 9210 + }, + { + "epoch": 0.0845328687998533, + "learning_rate": 0.00018309525992481893, + "loss": 0.8606, + "mean_token_accuracy": 0.7430299639701843, + "num_tokens": 21334874.0, + "step": 9220 + }, + { + "epoch": 0.08462455303933254, + "learning_rate": 0.0001830769230769231, + "loss": 0.9054, + "mean_token_accuracy": 0.7372971832752228, + "num_tokens": 21358174.0, + "step": 9230 + }, + { + "epoch": 0.08471623727881178, + "learning_rate": 0.00018305858622902723, + "loss": 0.8813, + "mean_token_accuracy": 0.7368301928043366, + "num_tokens": 21382025.0, + "step": 9240 + }, + { + "epoch": 0.084807921518291, + "learning_rate": 0.0001830402493811314, + "loss": 0.8823, + "mean_token_accuracy": 0.7336306691169738, + "num_tokens": 21404632.0, + "step": 9250 + }, + { + "epoch": 0.08489960575777024, + "learning_rate": 0.00018302191253323556, + "loss": 0.8547, + "mean_token_accuracy": 0.7515554547309875, + "num_tokens": 21428131.0, + "step": 9260 + }, + { + "epoch": 0.08499128999724948, + "learning_rate": 0.0001830035756853397, + "loss": 0.8745, + "mean_token_accuracy": 0.7392058372497559, + "num_tokens": 21451432.0, + "step": 9270 + }, + { + "epoch": 0.08508297423672871, + "learning_rate": 0.00018298523883744384, + "loss": 0.8871, + "mean_token_accuracy": 0.7410492539405823, + "num_tokens": 21474230.0, + "step": 9280 + }, + { + "epoch": 0.08517465847620793, + "learning_rate": 0.000182966901989548, + "loss": 0.9153, + "mean_token_accuracy": 0.7351513147354126, + "num_tokens": 21497153.0, + "step": 9290 + }, + { + "epoch": 0.08526634271568717, + "learning_rate": 0.00018294856514165214, + "loss": 0.8844, + "mean_token_accuracy": 0.7379489421844483, + "num_tokens": 21520721.0, + "step": 9300 + }, + { + "epoch": 0.08535802695516641, + "learning_rate": 0.00018293022829375633, + "loss": 0.8737, + "mean_token_accuracy": 0.7409141719341278, + "num_tokens": 21543904.0, + "step": 9310 + }, + { + "epoch": 0.08544971119464564, + "learning_rate": 0.00018291189144586047, + "loss": 0.8947, + "mean_token_accuracy": 0.7339003920555115, + "num_tokens": 21566753.0, + "step": 9320 + }, + { + "epoch": 0.08554139543412487, + "learning_rate": 0.0001828935545979646, + "loss": 0.8979, + "mean_token_accuracy": 0.7357079029083252, + "num_tokens": 21590527.0, + "step": 9330 + }, + { + "epoch": 0.0856330796736041, + "learning_rate": 0.00018287521775006878, + "loss": 0.874, + "mean_token_accuracy": 0.7461161673069, + "num_tokens": 21613767.0, + "step": 9340 + }, + { + "epoch": 0.08572476391308334, + "learning_rate": 0.00018285688090217291, + "loss": 0.8909, + "mean_token_accuracy": 0.7372100174427032, + "num_tokens": 21637037.0, + "step": 9350 + }, + { + "epoch": 0.08581644815256258, + "learning_rate": 0.00018283854405427708, + "loss": 0.9097, + "mean_token_accuracy": 0.7302749633789063, + "num_tokens": 21660356.0, + "step": 9360 + }, + { + "epoch": 0.08590813239204181, + "learning_rate": 0.00018282020720638122, + "loss": 0.8847, + "mean_token_accuracy": 0.7322764992713928, + "num_tokens": 21683097.0, + "step": 9370 + }, + { + "epoch": 0.08599981663152104, + "learning_rate": 0.00018280187035848538, + "loss": 0.9033, + "mean_token_accuracy": 0.7378346085548401, + "num_tokens": 21705375.0, + "step": 9380 + }, + { + "epoch": 0.08609150087100027, + "learning_rate": 0.00018278353351058955, + "loss": 0.8736, + "mean_token_accuracy": 0.7481322288513184, + "num_tokens": 21728893.0, + "step": 9390 + }, + { + "epoch": 0.08618318511047951, + "learning_rate": 0.0001827651966626937, + "loss": 0.9172, + "mean_token_accuracy": 0.7349271535873413, + "num_tokens": 21751697.0, + "step": 9400 + }, + { + "epoch": 0.08627486934995875, + "learning_rate": 0.00018274685981479785, + "loss": 0.86, + "mean_token_accuracy": 0.7382111191749573, + "num_tokens": 21774770.0, + "step": 9410 + }, + { + "epoch": 0.08636655358943797, + "learning_rate": 0.000182728522966902, + "loss": 0.9093, + "mean_token_accuracy": 0.733877283334732, + "num_tokens": 21796772.0, + "step": 9420 + }, + { + "epoch": 0.0864582378289172, + "learning_rate": 0.00018271018611900616, + "loss": 0.8818, + "mean_token_accuracy": 0.742811793088913, + "num_tokens": 21820725.0, + "step": 9430 + }, + { + "epoch": 0.08654992206839644, + "learning_rate": 0.00018269184927111032, + "loss": 0.896, + "mean_token_accuracy": 0.7337358832359314, + "num_tokens": 21843697.0, + "step": 9440 + }, + { + "epoch": 0.08664160630787568, + "learning_rate": 0.00018267351242321446, + "loss": 0.8616, + "mean_token_accuracy": 0.7448089361190796, + "num_tokens": 21866861.0, + "step": 9450 + }, + { + "epoch": 0.08673329054735492, + "learning_rate": 0.00018265517557531863, + "loss": 0.8978, + "mean_token_accuracy": 0.7339885711669922, + "num_tokens": 21889922.0, + "step": 9460 + }, + { + "epoch": 0.08682497478683414, + "learning_rate": 0.00018263683872742276, + "loss": 0.9258, + "mean_token_accuracy": 0.7256360352039337, + "num_tokens": 21912965.0, + "step": 9470 + }, + { + "epoch": 0.08691665902631338, + "learning_rate": 0.0001826185018795269, + "loss": 0.8548, + "mean_token_accuracy": 0.7446251630783081, + "num_tokens": 21936199.0, + "step": 9480 + }, + { + "epoch": 0.08700834326579261, + "learning_rate": 0.00018260016503163107, + "loss": 0.9191, + "mean_token_accuracy": 0.732340258359909, + "num_tokens": 21958595.0, + "step": 9490 + }, + { + "epoch": 0.08710002750527185, + "learning_rate": 0.0001825818281837352, + "loss": 0.8636, + "mean_token_accuracy": 0.7465512156486511, + "num_tokens": 21981051.0, + "step": 9500 + }, + { + "epoch": 0.08719171174475107, + "learning_rate": 0.0001825634913358394, + "loss": 0.8792, + "mean_token_accuracy": 0.733728039264679, + "num_tokens": 22004657.0, + "step": 9510 + }, + { + "epoch": 0.08728339598423031, + "learning_rate": 0.00018254515448794354, + "loss": 0.9001, + "mean_token_accuracy": 0.7300061106681823, + "num_tokens": 22027822.0, + "step": 9520 + }, + { + "epoch": 0.08737508022370954, + "learning_rate": 0.00018252681764004768, + "loss": 0.8689, + "mean_token_accuracy": 0.745732969045639, + "num_tokens": 22051033.0, + "step": 9530 + }, + { + "epoch": 0.08746676446318878, + "learning_rate": 0.00018250848079215184, + "loss": 0.88, + "mean_token_accuracy": 0.7341371715068817, + "num_tokens": 22074337.0, + "step": 9540 + }, + { + "epoch": 0.08755844870266802, + "learning_rate": 0.00018249014394425598, + "loss": 0.9054, + "mean_token_accuracy": 0.734076589345932, + "num_tokens": 22096998.0, + "step": 9550 + }, + { + "epoch": 0.08765013294214724, + "learning_rate": 0.00018247180709636014, + "loss": 0.874, + "mean_token_accuracy": 0.7426896154880523, + "num_tokens": 22119842.0, + "step": 9560 + }, + { + "epoch": 0.08774181718162648, + "learning_rate": 0.0001824534702484643, + "loss": 0.8793, + "mean_token_accuracy": 0.7316954851150512, + "num_tokens": 22142707.0, + "step": 9570 + }, + { + "epoch": 0.08783350142110571, + "learning_rate": 0.00018243513340056845, + "loss": 0.8868, + "mean_token_accuracy": 0.7348066747188569, + "num_tokens": 22166344.0, + "step": 9580 + }, + { + "epoch": 0.08792518566058495, + "learning_rate": 0.00018241679655267261, + "loss": 0.8568, + "mean_token_accuracy": 0.744666600227356, + "num_tokens": 22188550.0, + "step": 9590 + }, + { + "epoch": 0.08801686990006417, + "learning_rate": 0.00018239845970477675, + "loss": 0.8764, + "mean_token_accuracy": 0.7450824737548828, + "num_tokens": 22211255.0, + "step": 9600 + }, + { + "epoch": 0.08810855413954341, + "learning_rate": 0.00018238012285688092, + "loss": 0.9055, + "mean_token_accuracy": 0.7375835120677948, + "num_tokens": 22234451.0, + "step": 9610 + }, + { + "epoch": 0.08820023837902265, + "learning_rate": 0.00018236178600898506, + "loss": 0.8869, + "mean_token_accuracy": 0.7426702976226807, + "num_tokens": 22257234.0, + "step": 9620 + }, + { + "epoch": 0.08829192261850188, + "learning_rate": 0.00018234344916108922, + "loss": 0.8714, + "mean_token_accuracy": 0.746830689907074, + "num_tokens": 22280204.0, + "step": 9630 + }, + { + "epoch": 0.0883836068579811, + "learning_rate": 0.0001823251123131934, + "loss": 0.8792, + "mean_token_accuracy": 0.7361852407455445, + "num_tokens": 22304714.0, + "step": 9640 + }, + { + "epoch": 0.08847529109746034, + "learning_rate": 0.00018230677546529752, + "loss": 0.9159, + "mean_token_accuracy": 0.732985931634903, + "num_tokens": 22327734.0, + "step": 9650 + }, + { + "epoch": 0.08856697533693958, + "learning_rate": 0.0001822884386174017, + "loss": 0.8742, + "mean_token_accuracy": 0.7432840228080749, + "num_tokens": 22350796.0, + "step": 9660 + }, + { + "epoch": 0.08865865957641882, + "learning_rate": 0.00018227010176950583, + "loss": 0.8694, + "mean_token_accuracy": 0.7500789582729339, + "num_tokens": 22374105.0, + "step": 9670 + }, + { + "epoch": 0.08875034381589805, + "learning_rate": 0.00018225176492160997, + "loss": 0.9417, + "mean_token_accuracy": 0.7292441070079804, + "num_tokens": 22397321.0, + "step": 9680 + }, + { + "epoch": 0.08884202805537728, + "learning_rate": 0.00018223342807371413, + "loss": 0.855, + "mean_token_accuracy": 0.7461090803146362, + "num_tokens": 22420772.0, + "step": 9690 + }, + { + "epoch": 0.08893371229485651, + "learning_rate": 0.00018221509122581827, + "loss": 0.8963, + "mean_token_accuracy": 0.7368881940841675, + "num_tokens": 22443852.0, + "step": 9700 + }, + { + "epoch": 0.08902539653433575, + "learning_rate": 0.00018219675437792246, + "loss": 0.9074, + "mean_token_accuracy": 0.7292484223842621, + "num_tokens": 22467109.0, + "step": 9710 + }, + { + "epoch": 0.08911708077381499, + "learning_rate": 0.0001821784175300266, + "loss": 0.8251, + "mean_token_accuracy": 0.7499877512454987, + "num_tokens": 22490388.0, + "step": 9720 + }, + { + "epoch": 0.08920876501329421, + "learning_rate": 0.00018216008068213074, + "loss": 0.8924, + "mean_token_accuracy": 0.7306248307228088, + "num_tokens": 22513923.0, + "step": 9730 + }, + { + "epoch": 0.08930044925277345, + "learning_rate": 0.0001821417438342349, + "loss": 0.9283, + "mean_token_accuracy": 0.7331124186515808, + "num_tokens": 22537418.0, + "step": 9740 + }, + { + "epoch": 0.08939213349225268, + "learning_rate": 0.00018212340698633904, + "loss": 0.8983, + "mean_token_accuracy": 0.7407335758209228, + "num_tokens": 22560079.0, + "step": 9750 + }, + { + "epoch": 0.08948381773173192, + "learning_rate": 0.0001821050701384432, + "loss": 0.873, + "mean_token_accuracy": 0.7470311105251313, + "num_tokens": 22582433.0, + "step": 9760 + }, + { + "epoch": 0.08957550197121115, + "learning_rate": 0.00018208673329054737, + "loss": 0.8609, + "mean_token_accuracy": 0.7422303915023803, + "num_tokens": 22605173.0, + "step": 9770 + }, + { + "epoch": 0.08966718621069038, + "learning_rate": 0.0001820683964426515, + "loss": 0.8944, + "mean_token_accuracy": 0.7427703142166138, + "num_tokens": 22627989.0, + "step": 9780 + }, + { + "epoch": 0.08975887045016961, + "learning_rate": 0.00018205005959475568, + "loss": 0.8471, + "mean_token_accuracy": 0.7471030592918396, + "num_tokens": 22650742.0, + "step": 9790 + }, + { + "epoch": 0.08985055468964885, + "learning_rate": 0.00018203172274685982, + "loss": 0.8523, + "mean_token_accuracy": 0.7479526579380036, + "num_tokens": 22673623.0, + "step": 9800 + }, + { + "epoch": 0.08994223892912809, + "learning_rate": 0.00018201338589896398, + "loss": 0.8416, + "mean_token_accuracy": 0.7459315598011017, + "num_tokens": 22696704.0, + "step": 9810 + }, + { + "epoch": 0.09003392316860731, + "learning_rate": 0.00018199504905106812, + "loss": 0.9011, + "mean_token_accuracy": 0.7355086147785187, + "num_tokens": 22720122.0, + "step": 9820 + }, + { + "epoch": 0.09012560740808655, + "learning_rate": 0.00018197671220317229, + "loss": 0.9328, + "mean_token_accuracy": 0.7215277791023255, + "num_tokens": 22742374.0, + "step": 9830 + }, + { + "epoch": 0.09021729164756578, + "learning_rate": 0.00018195837535527645, + "loss": 0.9456, + "mean_token_accuracy": 0.7291106104850769, + "num_tokens": 22765871.0, + "step": 9840 + }, + { + "epoch": 0.09030897588704502, + "learning_rate": 0.0001819400385073806, + "loss": 0.8719, + "mean_token_accuracy": 0.7470474421977997, + "num_tokens": 22788967.0, + "step": 9850 + }, + { + "epoch": 0.09040066012652426, + "learning_rate": 0.00018192170165948475, + "loss": 0.8991, + "mean_token_accuracy": 0.7358954310417175, + "num_tokens": 22811479.0, + "step": 9860 + }, + { + "epoch": 0.09049234436600348, + "learning_rate": 0.0001819033648115889, + "loss": 0.8698, + "mean_token_accuracy": 0.7358669996261596, + "num_tokens": 22834308.0, + "step": 9870 + }, + { + "epoch": 0.09058402860548272, + "learning_rate": 0.00018188502796369303, + "loss": 0.9043, + "mean_token_accuracy": 0.7353496193885803, + "num_tokens": 22857743.0, + "step": 9880 + }, + { + "epoch": 0.09067571284496195, + "learning_rate": 0.0001818666911157972, + "loss": 0.8446, + "mean_token_accuracy": 0.7453127682209015, + "num_tokens": 22880218.0, + "step": 9890 + }, + { + "epoch": 0.09076739708444119, + "learning_rate": 0.00018184835426790136, + "loss": 0.8724, + "mean_token_accuracy": 0.7360309422016144, + "num_tokens": 22903463.0, + "step": 9900 + }, + { + "epoch": 0.09085908132392041, + "learning_rate": 0.00018183001742000553, + "loss": 0.8704, + "mean_token_accuracy": 0.7368826031684875, + "num_tokens": 22926125.0, + "step": 9910 + }, + { + "epoch": 0.09095076556339965, + "learning_rate": 0.00018181168057210967, + "loss": 0.8731, + "mean_token_accuracy": 0.7351884782314301, + "num_tokens": 22949921.0, + "step": 9920 + }, + { + "epoch": 0.09104244980287889, + "learning_rate": 0.0001817933437242138, + "loss": 0.9423, + "mean_token_accuracy": 0.7227811276912689, + "num_tokens": 22973397.0, + "step": 9930 + }, + { + "epoch": 0.09113413404235812, + "learning_rate": 0.00018177500687631797, + "loss": 0.8663, + "mean_token_accuracy": 0.7420787274837494, + "num_tokens": 22996340.0, + "step": 9940 + }, + { + "epoch": 0.09122581828183735, + "learning_rate": 0.0001817566700284221, + "loss": 0.8551, + "mean_token_accuracy": 0.746318656206131, + "num_tokens": 23018876.0, + "step": 9950 + }, + { + "epoch": 0.09131750252131658, + "learning_rate": 0.00018173833318052627, + "loss": 0.9181, + "mean_token_accuracy": 0.7355397641658783, + "num_tokens": 23041450.0, + "step": 9960 + }, + { + "epoch": 0.09140918676079582, + "learning_rate": 0.00018171999633263044, + "loss": 0.8854, + "mean_token_accuracy": 0.7342116951942443, + "num_tokens": 23064800.0, + "step": 9970 + }, + { + "epoch": 0.09150087100027506, + "learning_rate": 0.00018170165948473458, + "loss": 0.8047, + "mean_token_accuracy": 0.7571393847465515, + "num_tokens": 23087381.0, + "step": 9980 + }, + { + "epoch": 0.09159255523975429, + "learning_rate": 0.00018168332263683874, + "loss": 0.9063, + "mean_token_accuracy": 0.7324288666248322, + "num_tokens": 23110734.0, + "step": 9990 + }, + { + "epoch": 0.09168423947923351, + "learning_rate": 0.00018166498578894288, + "loss": 0.9023, + "mean_token_accuracy": 0.7366482257843018, + "num_tokens": 23133633.0, + "step": 10000 + }, + { + "epoch": 0.09177592371871275, + "learning_rate": 0.00018164664894104705, + "loss": 0.901, + "mean_token_accuracy": 0.7339980900287628, + "num_tokens": 23156919.0, + "step": 10010 + }, + { + "epoch": 0.09186760795819199, + "learning_rate": 0.00018162831209315118, + "loss": 0.909, + "mean_token_accuracy": 0.7299727261066437, + "num_tokens": 23180293.0, + "step": 10020 + }, + { + "epoch": 0.09195929219767122, + "learning_rate": 0.00018160997524525535, + "loss": 0.8927, + "mean_token_accuracy": 0.740869790315628, + "num_tokens": 23203594.0, + "step": 10030 + }, + { + "epoch": 0.09205097643715045, + "learning_rate": 0.00018159163839735952, + "loss": 0.8973, + "mean_token_accuracy": 0.7331617951393128, + "num_tokens": 23225983.0, + "step": 10040 + }, + { + "epoch": 0.09214266067662968, + "learning_rate": 0.00018157330154946365, + "loss": 0.9039, + "mean_token_accuracy": 0.7249781310558319, + "num_tokens": 23248764.0, + "step": 10050 + }, + { + "epoch": 0.09223434491610892, + "learning_rate": 0.00018155496470156782, + "loss": 0.9008, + "mean_token_accuracy": 0.7372535169124603, + "num_tokens": 23271310.0, + "step": 10060 + }, + { + "epoch": 0.09232602915558816, + "learning_rate": 0.00018153662785367196, + "loss": 0.9034, + "mean_token_accuracy": 0.7302026450634003, + "num_tokens": 23293634.0, + "step": 10070 + }, + { + "epoch": 0.0924177133950674, + "learning_rate": 0.0001815182910057761, + "loss": 0.875, + "mean_token_accuracy": 0.7396530449390412, + "num_tokens": 23316858.0, + "step": 10080 + }, + { + "epoch": 0.09250939763454662, + "learning_rate": 0.00018149995415788026, + "loss": 0.8783, + "mean_token_accuracy": 0.7374988317489624, + "num_tokens": 23339146.0, + "step": 10090 + }, + { + "epoch": 0.09260108187402585, + "learning_rate": 0.00018148161730998443, + "loss": 0.8557, + "mean_token_accuracy": 0.7460222184658051, + "num_tokens": 23363154.0, + "step": 10100 + }, + { + "epoch": 0.09269276611350509, + "learning_rate": 0.0001814632804620886, + "loss": 0.9, + "mean_token_accuracy": 0.7356420278549194, + "num_tokens": 23386881.0, + "step": 10110 + }, + { + "epoch": 0.09278445035298433, + "learning_rate": 0.00018144494361419273, + "loss": 0.8941, + "mean_token_accuracy": 0.7426242411136628, + "num_tokens": 23409505.0, + "step": 10120 + }, + { + "epoch": 0.09287613459246355, + "learning_rate": 0.00018142660676629687, + "loss": 0.8851, + "mean_token_accuracy": 0.7426791250705719, + "num_tokens": 23432008.0, + "step": 10130 + }, + { + "epoch": 0.09296781883194279, + "learning_rate": 0.00018140826991840103, + "loss": 0.8507, + "mean_token_accuracy": 0.7449314594268799, + "num_tokens": 23455531.0, + "step": 10140 + }, + { + "epoch": 0.09305950307142202, + "learning_rate": 0.00018138993307050517, + "loss": 0.8933, + "mean_token_accuracy": 0.7333428859710693, + "num_tokens": 23480250.0, + "step": 10150 + }, + { + "epoch": 0.09315118731090126, + "learning_rate": 0.00018137159622260936, + "loss": 0.8911, + "mean_token_accuracy": 0.7399576127529144, + "num_tokens": 23503635.0, + "step": 10160 + }, + { + "epoch": 0.0932428715503805, + "learning_rate": 0.0001813532593747135, + "loss": 0.8613, + "mean_token_accuracy": 0.7430021822452545, + "num_tokens": 23527143.0, + "step": 10170 + }, + { + "epoch": 0.09333455578985972, + "learning_rate": 0.00018133492252681764, + "loss": 0.8669, + "mean_token_accuracy": 0.7376038372516632, + "num_tokens": 23550196.0, + "step": 10180 + }, + { + "epoch": 0.09342624002933896, + "learning_rate": 0.0001813165856789218, + "loss": 0.9163, + "mean_token_accuracy": 0.7347811579704284, + "num_tokens": 23573328.0, + "step": 10190 + }, + { + "epoch": 0.09351792426881819, + "learning_rate": 0.00018129824883102595, + "loss": 0.8665, + "mean_token_accuracy": 0.7413029789924621, + "num_tokens": 23596881.0, + "step": 10200 + }, + { + "epoch": 0.09360960850829743, + "learning_rate": 0.0001812799119831301, + "loss": 0.9292, + "mean_token_accuracy": 0.7272100985050202, + "num_tokens": 23620234.0, + "step": 10210 + }, + { + "epoch": 0.09370129274777665, + "learning_rate": 0.00018126157513523425, + "loss": 0.8538, + "mean_token_accuracy": 0.7449434697628021, + "num_tokens": 23643870.0, + "step": 10220 + }, + { + "epoch": 0.09379297698725589, + "learning_rate": 0.00018124323828733841, + "loss": 0.9175, + "mean_token_accuracy": 0.7336058020591736, + "num_tokens": 23666228.0, + "step": 10230 + }, + { + "epoch": 0.09388466122673512, + "learning_rate": 0.00018122490143944258, + "loss": 0.8563, + "mean_token_accuracy": 0.7398800075054168, + "num_tokens": 23690317.0, + "step": 10240 + }, + { + "epoch": 0.09397634546621436, + "learning_rate": 0.00018120656459154672, + "loss": 0.8536, + "mean_token_accuracy": 0.7451589703559875, + "num_tokens": 23713023.0, + "step": 10250 + }, + { + "epoch": 0.09406802970569358, + "learning_rate": 0.00018118822774365088, + "loss": 0.9027, + "mean_token_accuracy": 0.7337402164936065, + "num_tokens": 23736779.0, + "step": 10260 + }, + { + "epoch": 0.09415971394517282, + "learning_rate": 0.00018116989089575502, + "loss": 0.8761, + "mean_token_accuracy": 0.7383345663547516, + "num_tokens": 23759880.0, + "step": 10270 + }, + { + "epoch": 0.09425139818465206, + "learning_rate": 0.00018115155404785916, + "loss": 0.884, + "mean_token_accuracy": 0.7440394878387451, + "num_tokens": 23782863.0, + "step": 10280 + }, + { + "epoch": 0.0943430824241313, + "learning_rate": 0.00018113321719996335, + "loss": 0.9068, + "mean_token_accuracy": 0.7336950719356536, + "num_tokens": 23806069.0, + "step": 10290 + }, + { + "epoch": 0.09443476666361053, + "learning_rate": 0.0001811148803520675, + "loss": 0.8937, + "mean_token_accuracy": 0.7380026817321778, + "num_tokens": 23829547.0, + "step": 10300 + }, + { + "epoch": 0.09452645090308975, + "learning_rate": 0.00018109654350417166, + "loss": 0.9029, + "mean_token_accuracy": 0.7320657312870026, + "num_tokens": 23852311.0, + "step": 10310 + }, + { + "epoch": 0.09461813514256899, + "learning_rate": 0.0001810782066562758, + "loss": 0.8758, + "mean_token_accuracy": 0.7432155132293701, + "num_tokens": 23875025.0, + "step": 10320 + }, + { + "epoch": 0.09470981938204823, + "learning_rate": 0.00018105986980837993, + "loss": 0.8583, + "mean_token_accuracy": 0.7418897330760956, + "num_tokens": 23898321.0, + "step": 10330 + }, + { + "epoch": 0.09480150362152746, + "learning_rate": 0.0001810415329604841, + "loss": 0.8863, + "mean_token_accuracy": 0.7378986597061157, + "num_tokens": 23922891.0, + "step": 10340 + }, + { + "epoch": 0.09489318786100669, + "learning_rate": 0.00018102319611258824, + "loss": 0.8774, + "mean_token_accuracy": 0.7400460600852966, + "num_tokens": 23945787.0, + "step": 10350 + }, + { + "epoch": 0.09498487210048592, + "learning_rate": 0.00018100485926469243, + "loss": 0.9182, + "mean_token_accuracy": 0.7314947068691253, + "num_tokens": 23969040.0, + "step": 10360 + }, + { + "epoch": 0.09507655633996516, + "learning_rate": 0.00018098652241679657, + "loss": 0.9068, + "mean_token_accuracy": 0.7313754498958588, + "num_tokens": 23992210.0, + "step": 10370 + }, + { + "epoch": 0.0951682405794444, + "learning_rate": 0.0001809681855689007, + "loss": 0.8971, + "mean_token_accuracy": 0.7337064266204834, + "num_tokens": 24014546.0, + "step": 10380 + }, + { + "epoch": 0.09525992481892363, + "learning_rate": 0.00018094984872100487, + "loss": 0.8936, + "mean_token_accuracy": 0.7389392912387848, + "num_tokens": 24037577.0, + "step": 10390 + }, + { + "epoch": 0.09535160905840286, + "learning_rate": 0.000180931511873109, + "loss": 0.8682, + "mean_token_accuracy": 0.7403826177120209, + "num_tokens": 24060043.0, + "step": 10400 + }, + { + "epoch": 0.09544329329788209, + "learning_rate": 0.00018091317502521318, + "loss": 0.8946, + "mean_token_accuracy": 0.737509262561798, + "num_tokens": 24083426.0, + "step": 10410 + }, + { + "epoch": 0.09553497753736133, + "learning_rate": 0.00018089483817731734, + "loss": 0.8635, + "mean_token_accuracy": 0.74267076253891, + "num_tokens": 24106035.0, + "step": 10420 + }, + { + "epoch": 0.09562666177684057, + "learning_rate": 0.00018087650132942148, + "loss": 0.8746, + "mean_token_accuracy": 0.741468733549118, + "num_tokens": 24128673.0, + "step": 10430 + }, + { + "epoch": 0.09571834601631979, + "learning_rate": 0.00018085816448152564, + "loss": 0.8833, + "mean_token_accuracy": 0.7361687660217285, + "num_tokens": 24151675.0, + "step": 10440 + }, + { + "epoch": 0.09581003025579903, + "learning_rate": 0.00018083982763362978, + "loss": 0.9131, + "mean_token_accuracy": 0.734002023935318, + "num_tokens": 24174869.0, + "step": 10450 + }, + { + "epoch": 0.09590171449527826, + "learning_rate": 0.00018082149078573395, + "loss": 0.881, + "mean_token_accuracy": 0.7427867949008942, + "num_tokens": 24198932.0, + "step": 10460 + }, + { + "epoch": 0.0959933987347575, + "learning_rate": 0.00018080315393783809, + "loss": 0.9253, + "mean_token_accuracy": 0.7226717889308929, + "num_tokens": 24220961.0, + "step": 10470 + }, + { + "epoch": 0.09608508297423674, + "learning_rate": 0.00018078481708994222, + "loss": 0.9018, + "mean_token_accuracy": 0.7350903332233429, + "num_tokens": 24243768.0, + "step": 10480 + }, + { + "epoch": 0.09617676721371596, + "learning_rate": 0.00018076648024204642, + "loss": 0.9096, + "mean_token_accuracy": 0.7298749208450317, + "num_tokens": 24267112.0, + "step": 10490 + }, + { + "epoch": 0.0962684514531952, + "learning_rate": 0.00018074814339415056, + "loss": 0.8537, + "mean_token_accuracy": 0.7433853507041931, + "num_tokens": 24290280.0, + "step": 10500 + }, + { + "epoch": 0.09636013569267443, + "learning_rate": 0.00018072980654625472, + "loss": 0.876, + "mean_token_accuracy": 0.7451959550380707, + "num_tokens": 24313419.0, + "step": 10510 + }, + { + "epoch": 0.09645181993215367, + "learning_rate": 0.00018071146969835886, + "loss": 0.8936, + "mean_token_accuracy": 0.7386884212493896, + "num_tokens": 24336293.0, + "step": 10520 + }, + { + "epoch": 0.09654350417163289, + "learning_rate": 0.000180693132850463, + "loss": 0.8308, + "mean_token_accuracy": 0.7562291979789734, + "num_tokens": 24359607.0, + "step": 10530 + }, + { + "epoch": 0.09663518841111213, + "learning_rate": 0.00018067479600256716, + "loss": 0.9069, + "mean_token_accuracy": 0.7358807027339935, + "num_tokens": 24383134.0, + "step": 10540 + }, + { + "epoch": 0.09672687265059136, + "learning_rate": 0.00018065645915467133, + "loss": 0.8859, + "mean_token_accuracy": 0.7362659752368927, + "num_tokens": 24405313.0, + "step": 10550 + }, + { + "epoch": 0.0968185568900706, + "learning_rate": 0.0001806381223067755, + "loss": 0.9059, + "mean_token_accuracy": 0.7316841602325439, + "num_tokens": 24428495.0, + "step": 10560 + }, + { + "epoch": 0.09691024112954984, + "learning_rate": 0.00018061978545887963, + "loss": 0.8603, + "mean_token_accuracy": 0.7400094747543335, + "num_tokens": 24451005.0, + "step": 10570 + }, + { + "epoch": 0.09700192536902906, + "learning_rate": 0.00018060144861098377, + "loss": 0.8448, + "mean_token_accuracy": 0.7427947461605072, + "num_tokens": 24474038.0, + "step": 10580 + }, + { + "epoch": 0.0970936096085083, + "learning_rate": 0.00018058311176308794, + "loss": 0.8342, + "mean_token_accuracy": 0.7481784880161285, + "num_tokens": 24497775.0, + "step": 10590 + }, + { + "epoch": 0.09718529384798753, + "learning_rate": 0.00018056477491519207, + "loss": 0.8443, + "mean_token_accuracy": 0.7447938144207, + "num_tokens": 24520891.0, + "step": 10600 + }, + { + "epoch": 0.09727697808746677, + "learning_rate": 0.00018054643806729624, + "loss": 0.8845, + "mean_token_accuracy": 0.7382242679595947, + "num_tokens": 24544005.0, + "step": 10610 + }, + { + "epoch": 0.09736866232694599, + "learning_rate": 0.0001805281012194004, + "loss": 0.8433, + "mean_token_accuracy": 0.750395393371582, + "num_tokens": 24566293.0, + "step": 10620 + }, + { + "epoch": 0.09746034656642523, + "learning_rate": 0.00018050976437150454, + "loss": 0.8766, + "mean_token_accuracy": 0.7411053121089936, + "num_tokens": 24589497.0, + "step": 10630 + }, + { + "epoch": 0.09755203080590447, + "learning_rate": 0.0001804914275236087, + "loss": 0.859, + "mean_token_accuracy": 0.7437268733978272, + "num_tokens": 24611898.0, + "step": 10640 + }, + { + "epoch": 0.0976437150453837, + "learning_rate": 0.00018047309067571285, + "loss": 0.8612, + "mean_token_accuracy": 0.7459022343158722, + "num_tokens": 24636191.0, + "step": 10650 + }, + { + "epoch": 0.09773539928486293, + "learning_rate": 0.000180454753827817, + "loss": 0.8518, + "mean_token_accuracy": 0.7471199095249176, + "num_tokens": 24659648.0, + "step": 10660 + }, + { + "epoch": 0.09782708352434216, + "learning_rate": 0.00018043641697992115, + "loss": 0.8632, + "mean_token_accuracy": 0.7440553903579712, + "num_tokens": 24682546.0, + "step": 10670 + }, + { + "epoch": 0.0979187677638214, + "learning_rate": 0.00018041808013202532, + "loss": 0.8861, + "mean_token_accuracy": 0.738535338640213, + "num_tokens": 24705496.0, + "step": 10680 + }, + { + "epoch": 0.09801045200330064, + "learning_rate": 0.00018039974328412948, + "loss": 0.8723, + "mean_token_accuracy": 0.7417737483978272, + "num_tokens": 24729135.0, + "step": 10690 + }, + { + "epoch": 0.09810213624277987, + "learning_rate": 0.00018038140643623362, + "loss": 0.8556, + "mean_token_accuracy": 0.7444552779197693, + "num_tokens": 24752266.0, + "step": 10700 + }, + { + "epoch": 0.0981938204822591, + "learning_rate": 0.00018036306958833779, + "loss": 0.8946, + "mean_token_accuracy": 0.7364124059677124, + "num_tokens": 24774873.0, + "step": 10710 + }, + { + "epoch": 0.09828550472173833, + "learning_rate": 0.00018034473274044192, + "loss": 0.8723, + "mean_token_accuracy": 0.7340504467487335, + "num_tokens": 24797617.0, + "step": 10720 + }, + { + "epoch": 0.09837718896121757, + "learning_rate": 0.00018032639589254606, + "loss": 0.8674, + "mean_token_accuracy": 0.7438235223293305, + "num_tokens": 24821454.0, + "step": 10730 + }, + { + "epoch": 0.0984688732006968, + "learning_rate": 0.00018030805904465023, + "loss": 0.9345, + "mean_token_accuracy": 0.7265106618404389, + "num_tokens": 24843857.0, + "step": 10740 + }, + { + "epoch": 0.09856055744017603, + "learning_rate": 0.0001802897221967544, + "loss": 0.8589, + "mean_token_accuracy": 0.7420856058597565, + "num_tokens": 24867256.0, + "step": 10750 + }, + { + "epoch": 0.09865224167965526, + "learning_rate": 0.00018027138534885856, + "loss": 0.9076, + "mean_token_accuracy": 0.7344007968902588, + "num_tokens": 24890614.0, + "step": 10760 + }, + { + "epoch": 0.0987439259191345, + "learning_rate": 0.0001802530485009627, + "loss": 0.8276, + "mean_token_accuracy": 0.7482860684394836, + "num_tokens": 24913653.0, + "step": 10770 + }, + { + "epoch": 0.09883561015861374, + "learning_rate": 0.00018023471165306683, + "loss": 0.9213, + "mean_token_accuracy": 0.7255630433559418, + "num_tokens": 24936755.0, + "step": 10780 + }, + { + "epoch": 0.09892729439809297, + "learning_rate": 0.000180216374805171, + "loss": 0.8781, + "mean_token_accuracy": 0.7428742527961731, + "num_tokens": 24960279.0, + "step": 10790 + }, + { + "epoch": 0.0990189786375722, + "learning_rate": 0.00018019803795727514, + "loss": 0.8811, + "mean_token_accuracy": 0.7340105235576629, + "num_tokens": 24982434.0, + "step": 10800 + }, + { + "epoch": 0.09911066287705143, + "learning_rate": 0.0001801797011093793, + "loss": 0.8861, + "mean_token_accuracy": 0.7397896409034729, + "num_tokens": 25005674.0, + "step": 10810 + }, + { + "epoch": 0.09920234711653067, + "learning_rate": 0.00018016136426148347, + "loss": 0.8681, + "mean_token_accuracy": 0.7424762189388275, + "num_tokens": 25029219.0, + "step": 10820 + }, + { + "epoch": 0.0992940313560099, + "learning_rate": 0.0001801430274135876, + "loss": 0.8851, + "mean_token_accuracy": 0.7344321787357331, + "num_tokens": 25051932.0, + "step": 10830 + }, + { + "epoch": 0.09938571559548913, + "learning_rate": 0.00018012469056569177, + "loss": 0.9175, + "mean_token_accuracy": 0.7275677442550659, + "num_tokens": 25075651.0, + "step": 10840 + }, + { + "epoch": 0.09947739983496837, + "learning_rate": 0.0001801063537177959, + "loss": 0.8489, + "mean_token_accuracy": 0.7498330891132354, + "num_tokens": 25098936.0, + "step": 10850 + }, + { + "epoch": 0.0995690840744476, + "learning_rate": 0.00018008801686990008, + "loss": 0.9123, + "mean_token_accuracy": 0.7343634068965912, + "num_tokens": 25121710.0, + "step": 10860 + }, + { + "epoch": 0.09966076831392684, + "learning_rate": 0.00018006968002200422, + "loss": 0.8283, + "mean_token_accuracy": 0.7467993855476379, + "num_tokens": 25144107.0, + "step": 10870 + }, + { + "epoch": 0.09975245255340608, + "learning_rate": 0.00018005134317410838, + "loss": 0.8872, + "mean_token_accuracy": 0.7347580850124359, + "num_tokens": 25166860.0, + "step": 10880 + }, + { + "epoch": 0.0998441367928853, + "learning_rate": 0.00018003300632621255, + "loss": 0.8845, + "mean_token_accuracy": 0.7424611270427703, + "num_tokens": 25190298.0, + "step": 10890 + }, + { + "epoch": 0.09993582103236454, + "learning_rate": 0.00018001466947831668, + "loss": 0.8873, + "mean_token_accuracy": 0.7385188579559326, + "num_tokens": 25213595.0, + "step": 10900 + }, + { + "epoch": 0.10002750527184377, + "learning_rate": 0.00017999633263042085, + "loss": 0.8652, + "mean_token_accuracy": 0.7345197677612305, + "num_tokens": 25236233.0, + "step": 10910 + }, + { + "epoch": 0.10011918951132301, + "learning_rate": 0.000179977995782525, + "loss": 0.9006, + "mean_token_accuracy": 0.7335421979427338, + "num_tokens": 25259579.0, + "step": 10920 + }, + { + "epoch": 0.10021087375080223, + "learning_rate": 0.00017995965893462913, + "loss": 0.891, + "mean_token_accuracy": 0.7389984250068664, + "num_tokens": 25282412.0, + "step": 10930 + }, + { + "epoch": 0.10030255799028147, + "learning_rate": 0.0001799413220867333, + "loss": 0.8625, + "mean_token_accuracy": 0.7452229619026184, + "num_tokens": 25305507.0, + "step": 10940 + }, + { + "epoch": 0.1003942422297607, + "learning_rate": 0.00017992298523883746, + "loss": 0.8811, + "mean_token_accuracy": 0.7357382118701935, + "num_tokens": 25329647.0, + "step": 10950 + }, + { + "epoch": 0.10048592646923994, + "learning_rate": 0.00017990464839094162, + "loss": 0.8681, + "mean_token_accuracy": 0.7397084474563599, + "num_tokens": 25353597.0, + "step": 10960 + }, + { + "epoch": 0.10057761070871916, + "learning_rate": 0.00017988631154304576, + "loss": 0.8788, + "mean_token_accuracy": 0.744835251569748, + "num_tokens": 25377101.0, + "step": 10970 + }, + { + "epoch": 0.1006692949481984, + "learning_rate": 0.0001798679746951499, + "loss": 0.8753, + "mean_token_accuracy": 0.739315527677536, + "num_tokens": 25400047.0, + "step": 10980 + }, + { + "epoch": 0.10076097918767764, + "learning_rate": 0.00017984963784725406, + "loss": 0.8854, + "mean_token_accuracy": 0.733559387922287, + "num_tokens": 25423305.0, + "step": 10990 + }, + { + "epoch": 0.10085266342715687, + "learning_rate": 0.0001798313009993582, + "loss": 0.8619, + "mean_token_accuracy": 0.7448963761329651, + "num_tokens": 25446291.0, + "step": 11000 + }, + { + "epoch": 0.10094434766663611, + "learning_rate": 0.00017981296415146237, + "loss": 0.8818, + "mean_token_accuracy": 0.7425753057003022, + "num_tokens": 25469812.0, + "step": 11010 + }, + { + "epoch": 0.10103603190611533, + "learning_rate": 0.00017979462730356653, + "loss": 0.8753, + "mean_token_accuracy": 0.7363907277584076, + "num_tokens": 25492493.0, + "step": 11020 + }, + { + "epoch": 0.10112771614559457, + "learning_rate": 0.00017977629045567067, + "loss": 0.8438, + "mean_token_accuracy": 0.7488499164581299, + "num_tokens": 25516184.0, + "step": 11030 + }, + { + "epoch": 0.10121940038507381, + "learning_rate": 0.00017975795360777484, + "loss": 0.8408, + "mean_token_accuracy": 0.7440124809741974, + "num_tokens": 25539516.0, + "step": 11040 + }, + { + "epoch": 0.10131108462455304, + "learning_rate": 0.00017973961675987898, + "loss": 0.9001, + "mean_token_accuracy": 0.7308463513851166, + "num_tokens": 25563494.0, + "step": 11050 + }, + { + "epoch": 0.10140276886403227, + "learning_rate": 0.00017972127991198314, + "loss": 0.8787, + "mean_token_accuracy": 0.7380222618579865, + "num_tokens": 25587273.0, + "step": 11060 + }, + { + "epoch": 0.1014944531035115, + "learning_rate": 0.00017970294306408728, + "loss": 0.8705, + "mean_token_accuracy": 0.739801687002182, + "num_tokens": 25610363.0, + "step": 11070 + }, + { + "epoch": 0.10158613734299074, + "learning_rate": 0.00017968460621619145, + "loss": 0.8621, + "mean_token_accuracy": 0.7454406261444092, + "num_tokens": 25632975.0, + "step": 11080 + }, + { + "epoch": 0.10167782158246998, + "learning_rate": 0.0001796662693682956, + "loss": 0.8685, + "mean_token_accuracy": 0.7407660961151123, + "num_tokens": 25656036.0, + "step": 11090 + }, + { + "epoch": 0.10176950582194921, + "learning_rate": 0.00017964793252039975, + "loss": 0.8875, + "mean_token_accuracy": 0.739461475610733, + "num_tokens": 25679393.0, + "step": 11100 + }, + { + "epoch": 0.10186119006142844, + "learning_rate": 0.00017962959567250391, + "loss": 0.8769, + "mean_token_accuracy": 0.7353558778762818, + "num_tokens": 25702762.0, + "step": 11110 + }, + { + "epoch": 0.10195287430090767, + "learning_rate": 0.00017961125882460805, + "loss": 0.9116, + "mean_token_accuracy": 0.7379616916179657, + "num_tokens": 25725428.0, + "step": 11120 + }, + { + "epoch": 0.10204455854038691, + "learning_rate": 0.0001795929219767122, + "loss": 0.9091, + "mean_token_accuracy": 0.7295917868614197, + "num_tokens": 25748562.0, + "step": 11130 + }, + { + "epoch": 0.10213624277986615, + "learning_rate": 0.00017957458512881638, + "loss": 0.8869, + "mean_token_accuracy": 0.7402543067932129, + "num_tokens": 25772133.0, + "step": 11140 + }, + { + "epoch": 0.10222792701934537, + "learning_rate": 0.00017955624828092052, + "loss": 0.8982, + "mean_token_accuracy": 0.724835330247879, + "num_tokens": 25794433.0, + "step": 11150 + }, + { + "epoch": 0.1023196112588246, + "learning_rate": 0.0001795379114330247, + "loss": 0.8815, + "mean_token_accuracy": 0.7409479439258575, + "num_tokens": 25816895.0, + "step": 11160 + }, + { + "epoch": 0.10241129549830384, + "learning_rate": 0.00017951957458512883, + "loss": 0.8936, + "mean_token_accuracy": 0.7375987052917481, + "num_tokens": 25839641.0, + "step": 11170 + }, + { + "epoch": 0.10250297973778308, + "learning_rate": 0.00017950123773723296, + "loss": 0.8588, + "mean_token_accuracy": 0.7427475035190583, + "num_tokens": 25862957.0, + "step": 11180 + }, + { + "epoch": 0.10259466397726232, + "learning_rate": 0.00017948290088933713, + "loss": 0.9123, + "mean_token_accuracy": 0.7334792375564575, + "num_tokens": 25886323.0, + "step": 11190 + }, + { + "epoch": 0.10268634821674154, + "learning_rate": 0.00017946456404144127, + "loss": 0.8911, + "mean_token_accuracy": 0.7416549921035767, + "num_tokens": 25909248.0, + "step": 11200 + }, + { + "epoch": 0.10277803245622077, + "learning_rate": 0.00017944622719354543, + "loss": 0.9048, + "mean_token_accuracy": 0.730409562587738, + "num_tokens": 25932875.0, + "step": 11210 + }, + { + "epoch": 0.10286971669570001, + "learning_rate": 0.0001794278903456496, + "loss": 0.86, + "mean_token_accuracy": 0.7465738594532013, + "num_tokens": 25955886.0, + "step": 11220 + }, + { + "epoch": 0.10296140093517925, + "learning_rate": 0.00017940955349775374, + "loss": 0.9391, + "mean_token_accuracy": 0.7274121463298797, + "num_tokens": 25979004.0, + "step": 11230 + }, + { + "epoch": 0.10305308517465847, + "learning_rate": 0.0001793912166498579, + "loss": 0.8983, + "mean_token_accuracy": 0.7318204581737519, + "num_tokens": 26002269.0, + "step": 11240 + }, + { + "epoch": 0.10314476941413771, + "learning_rate": 0.00017937287980196204, + "loss": 0.879, + "mean_token_accuracy": 0.7433506727218628, + "num_tokens": 26026515.0, + "step": 11250 + }, + { + "epoch": 0.10323645365361694, + "learning_rate": 0.0001793545429540662, + "loss": 0.8626, + "mean_token_accuracy": 0.7416462600231171, + "num_tokens": 26050493.0, + "step": 11260 + }, + { + "epoch": 0.10332813789309618, + "learning_rate": 0.00017933620610617037, + "loss": 0.9057, + "mean_token_accuracy": 0.7388849973678588, + "num_tokens": 26073510.0, + "step": 11270 + }, + { + "epoch": 0.1034198221325754, + "learning_rate": 0.0001793178692582745, + "loss": 0.9024, + "mean_token_accuracy": 0.7374939978122711, + "num_tokens": 26096348.0, + "step": 11280 + }, + { + "epoch": 0.10351150637205464, + "learning_rate": 0.00017929953241037868, + "loss": 0.8201, + "mean_token_accuracy": 0.7585200309753418, + "num_tokens": 26119821.0, + "step": 11290 + }, + { + "epoch": 0.10360319061153388, + "learning_rate": 0.0001792811955624828, + "loss": 0.8929, + "mean_token_accuracy": 0.7429881691932678, + "num_tokens": 26143672.0, + "step": 11300 + }, + { + "epoch": 0.10369487485101311, + "learning_rate": 0.00017926285871458698, + "loss": 0.8975, + "mean_token_accuracy": 0.7410037696361542, + "num_tokens": 26166411.0, + "step": 11310 + }, + { + "epoch": 0.10378655909049235, + "learning_rate": 0.00017924452186669112, + "loss": 0.9039, + "mean_token_accuracy": 0.7327254235744476, + "num_tokens": 26190002.0, + "step": 11320 + }, + { + "epoch": 0.10387824332997157, + "learning_rate": 0.00017922618501879526, + "loss": 0.884, + "mean_token_accuracy": 0.739010089635849, + "num_tokens": 26213467.0, + "step": 11330 + }, + { + "epoch": 0.10396992756945081, + "learning_rate": 0.00017920784817089945, + "loss": 0.8971, + "mean_token_accuracy": 0.7366046905517578, + "num_tokens": 26237288.0, + "step": 11340 + }, + { + "epoch": 0.10406161180893005, + "learning_rate": 0.00017918951132300359, + "loss": 0.8914, + "mean_token_accuracy": 0.7392790913581848, + "num_tokens": 26260388.0, + "step": 11350 + }, + { + "epoch": 0.10415329604840928, + "learning_rate": 0.00017917117447510775, + "loss": 0.883, + "mean_token_accuracy": 0.7385203599929809, + "num_tokens": 26284016.0, + "step": 11360 + }, + { + "epoch": 0.1042449802878885, + "learning_rate": 0.0001791528376272119, + "loss": 0.9186, + "mean_token_accuracy": 0.7294337689876557, + "num_tokens": 26307725.0, + "step": 11370 + }, + { + "epoch": 0.10433666452736774, + "learning_rate": 0.00017913450077931603, + "loss": 0.872, + "mean_token_accuracy": 0.740067058801651, + "num_tokens": 26330659.0, + "step": 11380 + }, + { + "epoch": 0.10442834876684698, + "learning_rate": 0.0001791161639314202, + "loss": 0.8711, + "mean_token_accuracy": 0.7400892734527588, + "num_tokens": 26353488.0, + "step": 11390 + }, + { + "epoch": 0.10452003300632622, + "learning_rate": 0.00017909782708352436, + "loss": 0.8859, + "mean_token_accuracy": 0.7375518560409546, + "num_tokens": 26376672.0, + "step": 11400 + }, + { + "epoch": 0.10461171724580545, + "learning_rate": 0.0001790794902356285, + "loss": 0.8924, + "mean_token_accuracy": 0.7375367045402527, + "num_tokens": 26400298.0, + "step": 11410 + }, + { + "epoch": 0.10470340148528468, + "learning_rate": 0.00017906115338773266, + "loss": 0.8716, + "mean_token_accuracy": 0.7399585485458374, + "num_tokens": 26422697.0, + "step": 11420 + }, + { + "epoch": 0.10479508572476391, + "learning_rate": 0.0001790428165398368, + "loss": 0.877, + "mean_token_accuracy": 0.7456361293792725, + "num_tokens": 26445665.0, + "step": 11430 + }, + { + "epoch": 0.10488676996424315, + "learning_rate": 0.00017902447969194097, + "loss": 0.8833, + "mean_token_accuracy": 0.7388562619686126, + "num_tokens": 26469096.0, + "step": 11440 + }, + { + "epoch": 0.10497845420372239, + "learning_rate": 0.0001790061428440451, + "loss": 0.8758, + "mean_token_accuracy": 0.744290167093277, + "num_tokens": 26492195.0, + "step": 11450 + }, + { + "epoch": 0.10507013844320161, + "learning_rate": 0.00017898780599614927, + "loss": 0.8701, + "mean_token_accuracy": 0.7436373651027679, + "num_tokens": 26515123.0, + "step": 11460 + }, + { + "epoch": 0.10516182268268084, + "learning_rate": 0.00017896946914825344, + "loss": 0.8677, + "mean_token_accuracy": 0.7376021027565003, + "num_tokens": 26538101.0, + "step": 11470 + }, + { + "epoch": 0.10525350692216008, + "learning_rate": 0.00017895113230035757, + "loss": 0.9099, + "mean_token_accuracy": 0.7306402206420899, + "num_tokens": 26560984.0, + "step": 11480 + }, + { + "epoch": 0.10534519116163932, + "learning_rate": 0.00017893279545246174, + "loss": 0.8278, + "mean_token_accuracy": 0.7509335875511169, + "num_tokens": 26584906.0, + "step": 11490 + }, + { + "epoch": 0.10543687540111855, + "learning_rate": 0.00017891445860456588, + "loss": 0.8929, + "mean_token_accuracy": 0.7350357353687287, + "num_tokens": 26607470.0, + "step": 11500 + }, + { + "epoch": 0.10552855964059778, + "learning_rate": 0.00017889612175667004, + "loss": 0.8589, + "mean_token_accuracy": 0.7428408443927765, + "num_tokens": 26630872.0, + "step": 11510 + }, + { + "epoch": 0.10562024388007701, + "learning_rate": 0.00017887778490877418, + "loss": 0.9204, + "mean_token_accuracy": 0.7317827820777894, + "num_tokens": 26653759.0, + "step": 11520 + }, + { + "epoch": 0.10571192811955625, + "learning_rate": 0.00017885944806087835, + "loss": 0.9528, + "mean_token_accuracy": 0.7178638577461243, + "num_tokens": 26677121.0, + "step": 11530 + }, + { + "epoch": 0.10580361235903549, + "learning_rate": 0.0001788411112129825, + "loss": 0.8625, + "mean_token_accuracy": 0.7380670189857483, + "num_tokens": 26700678.0, + "step": 11540 + }, + { + "epoch": 0.10589529659851471, + "learning_rate": 0.00017882277436508665, + "loss": 0.9528, + "mean_token_accuracy": 0.7202961683273316, + "num_tokens": 26724084.0, + "step": 11550 + }, + { + "epoch": 0.10598698083799395, + "learning_rate": 0.00017880443751719082, + "loss": 0.8636, + "mean_token_accuracy": 0.7396840393543244, + "num_tokens": 26746786.0, + "step": 11560 + }, + { + "epoch": 0.10607866507747318, + "learning_rate": 0.00017878610066929495, + "loss": 0.8728, + "mean_token_accuracy": 0.7380404055118561, + "num_tokens": 26770909.0, + "step": 11570 + }, + { + "epoch": 0.10617034931695242, + "learning_rate": 0.0001787677638213991, + "loss": 0.8609, + "mean_token_accuracy": 0.7454233050346375, + "num_tokens": 26794119.0, + "step": 11580 + }, + { + "epoch": 0.10626203355643164, + "learning_rate": 0.00017874942697350326, + "loss": 0.8557, + "mean_token_accuracy": 0.7433999359607697, + "num_tokens": 26817096.0, + "step": 11590 + }, + { + "epoch": 0.10635371779591088, + "learning_rate": 0.00017873109012560742, + "loss": 0.8296, + "mean_token_accuracy": 0.7519002318382263, + "num_tokens": 26840201.0, + "step": 11600 + }, + { + "epoch": 0.10644540203539012, + "learning_rate": 0.00017871275327771156, + "loss": 0.8736, + "mean_token_accuracy": 0.7433995008468628, + "num_tokens": 26862945.0, + "step": 11610 + }, + { + "epoch": 0.10653708627486935, + "learning_rate": 0.00017869441642981573, + "loss": 0.9185, + "mean_token_accuracy": 0.7319000780582428, + "num_tokens": 26886709.0, + "step": 11620 + }, + { + "epoch": 0.10662877051434859, + "learning_rate": 0.00017867607958191987, + "loss": 0.8349, + "mean_token_accuracy": 0.7504717409610748, + "num_tokens": 26909972.0, + "step": 11630 + }, + { + "epoch": 0.10672045475382781, + "learning_rate": 0.00017865774273402403, + "loss": 0.8242, + "mean_token_accuracy": 0.7521531820297241, + "num_tokens": 26932887.0, + "step": 11640 + }, + { + "epoch": 0.10681213899330705, + "learning_rate": 0.00017863940588612817, + "loss": 0.8836, + "mean_token_accuracy": 0.7407630920410156, + "num_tokens": 26955995.0, + "step": 11650 + }, + { + "epoch": 0.10690382323278629, + "learning_rate": 0.00017862106903823233, + "loss": 0.8662, + "mean_token_accuracy": 0.7427942395210266, + "num_tokens": 26979091.0, + "step": 11660 + }, + { + "epoch": 0.10699550747226552, + "learning_rate": 0.0001786027321903365, + "loss": 0.8595, + "mean_token_accuracy": 0.7429852724075318, + "num_tokens": 27001826.0, + "step": 11670 + }, + { + "epoch": 0.10708719171174474, + "learning_rate": 0.00017858439534244064, + "loss": 0.883, + "mean_token_accuracy": 0.7366941869258881, + "num_tokens": 27024878.0, + "step": 11680 + }, + { + "epoch": 0.10717887595122398, + "learning_rate": 0.0001785660584945448, + "loss": 0.8858, + "mean_token_accuracy": 0.7402225613594056, + "num_tokens": 27047969.0, + "step": 11690 + }, + { + "epoch": 0.10727056019070322, + "learning_rate": 0.00017854772164664894, + "loss": 0.8596, + "mean_token_accuracy": 0.743378323316574, + "num_tokens": 27070948.0, + "step": 11700 + }, + { + "epoch": 0.10736224443018245, + "learning_rate": 0.0001785293847987531, + "loss": 0.9495, + "mean_token_accuracy": 0.7240637183189392, + "num_tokens": 27094089.0, + "step": 11710 + }, + { + "epoch": 0.10745392866966169, + "learning_rate": 0.00017851104795085725, + "loss": 0.8912, + "mean_token_accuracy": 0.7427623808383942, + "num_tokens": 27117513.0, + "step": 11720 + }, + { + "epoch": 0.10754561290914091, + "learning_rate": 0.0001784927111029614, + "loss": 0.8667, + "mean_token_accuracy": 0.7423351585865021, + "num_tokens": 27141568.0, + "step": 11730 + }, + { + "epoch": 0.10763729714862015, + "learning_rate": 0.00017847437425506558, + "loss": 0.881, + "mean_token_accuracy": 0.7310326814651489, + "num_tokens": 27163758.0, + "step": 11740 + }, + { + "epoch": 0.10772898138809939, + "learning_rate": 0.00017845603740716972, + "loss": 0.8859, + "mean_token_accuracy": 0.7359584927558899, + "num_tokens": 27187215.0, + "step": 11750 + }, + { + "epoch": 0.10782066562757862, + "learning_rate": 0.00017843770055927388, + "loss": 0.8947, + "mean_token_accuracy": 0.7310957431793212, + "num_tokens": 27210322.0, + "step": 11760 + }, + { + "epoch": 0.10791234986705785, + "learning_rate": 0.00017841936371137802, + "loss": 0.9138, + "mean_token_accuracy": 0.7403761386871338, + "num_tokens": 27233377.0, + "step": 11770 + }, + { + "epoch": 0.10800403410653708, + "learning_rate": 0.00017840102686348216, + "loss": 0.8994, + "mean_token_accuracy": 0.7380115389823914, + "num_tokens": 27257227.0, + "step": 11780 + }, + { + "epoch": 0.10809571834601632, + "learning_rate": 0.00017838269001558635, + "loss": 0.8864, + "mean_token_accuracy": 0.738403606414795, + "num_tokens": 27280152.0, + "step": 11790 + }, + { + "epoch": 0.10818740258549556, + "learning_rate": 0.0001783643531676905, + "loss": 0.8818, + "mean_token_accuracy": 0.7386031329631806, + "num_tokens": 27304010.0, + "step": 11800 + }, + { + "epoch": 0.1082790868249748, + "learning_rate": 0.00017834601631979463, + "loss": 0.8917, + "mean_token_accuracy": 0.7318453073501587, + "num_tokens": 27326802.0, + "step": 11810 + }, + { + "epoch": 0.10837077106445402, + "learning_rate": 0.0001783276794718988, + "loss": 0.8832, + "mean_token_accuracy": 0.7354330539703369, + "num_tokens": 27349795.0, + "step": 11820 + }, + { + "epoch": 0.10846245530393325, + "learning_rate": 0.00017830934262400293, + "loss": 0.903, + "mean_token_accuracy": 0.7374026656150818, + "num_tokens": 27373434.0, + "step": 11830 + }, + { + "epoch": 0.10855413954341249, + "learning_rate": 0.0001782910057761071, + "loss": 0.8614, + "mean_token_accuracy": 0.7449547350406647, + "num_tokens": 27396953.0, + "step": 11840 + }, + { + "epoch": 0.10864582378289173, + "learning_rate": 0.00017827266892821123, + "loss": 0.8781, + "mean_token_accuracy": 0.7443978965282441, + "num_tokens": 27420440.0, + "step": 11850 + }, + { + "epoch": 0.10873750802237095, + "learning_rate": 0.0001782543320803154, + "loss": 0.8807, + "mean_token_accuracy": 0.7423559188842773, + "num_tokens": 27443543.0, + "step": 11860 + }, + { + "epoch": 0.10882919226185019, + "learning_rate": 0.00017823599523241956, + "loss": 0.8782, + "mean_token_accuracy": 0.7370914876461029, + "num_tokens": 27466587.0, + "step": 11870 + }, + { + "epoch": 0.10892087650132942, + "learning_rate": 0.0001782176583845237, + "loss": 0.8544, + "mean_token_accuracy": 0.7436290860176087, + "num_tokens": 27488972.0, + "step": 11880 + }, + { + "epoch": 0.10901256074080866, + "learning_rate": 0.00017819932153662787, + "loss": 0.882, + "mean_token_accuracy": 0.74011932015419, + "num_tokens": 27511518.0, + "step": 11890 + }, + { + "epoch": 0.10910424498028788, + "learning_rate": 0.000178180984688732, + "loss": 0.8835, + "mean_token_accuracy": 0.7381210803985596, + "num_tokens": 27533827.0, + "step": 11900 + }, + { + "epoch": 0.10919592921976712, + "learning_rate": 0.00017816264784083617, + "loss": 0.8848, + "mean_token_accuracy": 0.74366534948349, + "num_tokens": 27557508.0, + "step": 11910 + }, + { + "epoch": 0.10928761345924635, + "learning_rate": 0.00017814431099294034, + "loss": 0.8958, + "mean_token_accuracy": 0.7379620313644409, + "num_tokens": 27580767.0, + "step": 11920 + }, + { + "epoch": 0.10937929769872559, + "learning_rate": 0.00017812597414504448, + "loss": 0.8636, + "mean_token_accuracy": 0.7385945558547974, + "num_tokens": 27603997.0, + "step": 11930 + }, + { + "epoch": 0.10947098193820483, + "learning_rate": 0.00017810763729714864, + "loss": 0.8549, + "mean_token_accuracy": 0.7429787874221802, + "num_tokens": 27626885.0, + "step": 11940 + }, + { + "epoch": 0.10956266617768405, + "learning_rate": 0.00017808930044925278, + "loss": 0.8777, + "mean_token_accuracy": 0.7384230136871338, + "num_tokens": 27649938.0, + "step": 11950 + }, + { + "epoch": 0.10965435041716329, + "learning_rate": 0.00017807096360135695, + "loss": 0.8872, + "mean_token_accuracy": 0.7369516789913177, + "num_tokens": 27673030.0, + "step": 11960 + }, + { + "epoch": 0.10974603465664252, + "learning_rate": 0.00017805262675346108, + "loss": 0.8647, + "mean_token_accuracy": 0.7508829653263092, + "num_tokens": 27695459.0, + "step": 11970 + }, + { + "epoch": 0.10983771889612176, + "learning_rate": 0.00017803428990556522, + "loss": 0.8792, + "mean_token_accuracy": 0.7326285004615783, + "num_tokens": 27718179.0, + "step": 11980 + }, + { + "epoch": 0.10992940313560098, + "learning_rate": 0.00017801595305766941, + "loss": 0.8683, + "mean_token_accuracy": 0.7448980331420898, + "num_tokens": 27740608.0, + "step": 11990 + }, + { + "epoch": 0.11002108737508022, + "learning_rate": 0.00017799761620977355, + "loss": 0.8489, + "mean_token_accuracy": 0.7497345745563507, + "num_tokens": 27764201.0, + "step": 12000 + }, + { + "epoch": 0.11011277161455946, + "learning_rate": 0.00017797927936187772, + "loss": 0.8729, + "mean_token_accuracy": 0.7328741371631622, + "num_tokens": 27787189.0, + "step": 12010 + }, + { + "epoch": 0.1102044558540387, + "learning_rate": 0.00017796094251398186, + "loss": 0.9071, + "mean_token_accuracy": 0.7407233119010925, + "num_tokens": 27811354.0, + "step": 12020 + }, + { + "epoch": 0.11029614009351793, + "learning_rate": 0.000177942605666086, + "loss": 0.8717, + "mean_token_accuracy": 0.7401291847229003, + "num_tokens": 27834739.0, + "step": 12030 + }, + { + "epoch": 0.11038782433299715, + "learning_rate": 0.00017792426881819016, + "loss": 0.8729, + "mean_token_accuracy": 0.7361323416233063, + "num_tokens": 27857881.0, + "step": 12040 + }, + { + "epoch": 0.11047950857247639, + "learning_rate": 0.0001779059319702943, + "loss": 0.8754, + "mean_token_accuracy": 0.7374109506607056, + "num_tokens": 27880926.0, + "step": 12050 + }, + { + "epoch": 0.11057119281195563, + "learning_rate": 0.00017788759512239846, + "loss": 0.916, + "mean_token_accuracy": 0.7358609676361084, + "num_tokens": 27903447.0, + "step": 12060 + }, + { + "epoch": 0.11066287705143486, + "learning_rate": 0.00017786925827450263, + "loss": 0.8911, + "mean_token_accuracy": 0.734874165058136, + "num_tokens": 27926965.0, + "step": 12070 + }, + { + "epoch": 0.11075456129091409, + "learning_rate": 0.00017785092142660677, + "loss": 0.852, + "mean_token_accuracy": 0.743153166770935, + "num_tokens": 27949419.0, + "step": 12080 + }, + { + "epoch": 0.11084624553039332, + "learning_rate": 0.00017783258457871093, + "loss": 0.8693, + "mean_token_accuracy": 0.7415815830230713, + "num_tokens": 27973278.0, + "step": 12090 + }, + { + "epoch": 0.11093792976987256, + "learning_rate": 0.00017781424773081507, + "loss": 0.8617, + "mean_token_accuracy": 0.7533626735210419, + "num_tokens": 27995873.0, + "step": 12100 + }, + { + "epoch": 0.1110296140093518, + "learning_rate": 0.00017779591088291924, + "loss": 0.8951, + "mean_token_accuracy": 0.7394928812980652, + "num_tokens": 28019131.0, + "step": 12110 + }, + { + "epoch": 0.11112129824883103, + "learning_rate": 0.0001777775740350234, + "loss": 0.904, + "mean_token_accuracy": 0.7413673281669617, + "num_tokens": 28042400.0, + "step": 12120 + }, + { + "epoch": 0.11121298248831026, + "learning_rate": 0.00017775923718712754, + "loss": 0.8818, + "mean_token_accuracy": 0.7390436410903931, + "num_tokens": 28065576.0, + "step": 12130 + }, + { + "epoch": 0.11130466672778949, + "learning_rate": 0.0001777409003392317, + "loss": 0.8783, + "mean_token_accuracy": 0.7301335394382477, + "num_tokens": 28088931.0, + "step": 12140 + }, + { + "epoch": 0.11139635096726873, + "learning_rate": 0.00017772256349133584, + "loss": 0.843, + "mean_token_accuracy": 0.7469180881977081, + "num_tokens": 28112217.0, + "step": 12150 + }, + { + "epoch": 0.11148803520674797, + "learning_rate": 0.00017770422664344, + "loss": 0.8482, + "mean_token_accuracy": 0.7464567482471466, + "num_tokens": 28135744.0, + "step": 12160 + }, + { + "epoch": 0.11157971944622719, + "learning_rate": 0.00017768588979554415, + "loss": 0.907, + "mean_token_accuracy": 0.7300693154335022, + "num_tokens": 28158330.0, + "step": 12170 + }, + { + "epoch": 0.11167140368570642, + "learning_rate": 0.00017766755294764829, + "loss": 0.8557, + "mean_token_accuracy": 0.7448145389556885, + "num_tokens": 28182363.0, + "step": 12180 + }, + { + "epoch": 0.11176308792518566, + "learning_rate": 0.00017764921609975248, + "loss": 0.8375, + "mean_token_accuracy": 0.748042207956314, + "num_tokens": 28205894.0, + "step": 12190 + }, + { + "epoch": 0.1118547721646649, + "learning_rate": 0.00017763087925185662, + "loss": 0.894, + "mean_token_accuracy": 0.7306191265583039, + "num_tokens": 28228515.0, + "step": 12200 + }, + { + "epoch": 0.11194645640414412, + "learning_rate": 0.00017761254240396078, + "loss": 0.8945, + "mean_token_accuracy": 0.7436901509761811, + "num_tokens": 28251754.0, + "step": 12210 + }, + { + "epoch": 0.11203814064362336, + "learning_rate": 0.00017759420555606492, + "loss": 0.851, + "mean_token_accuracy": 0.7463106334209442, + "num_tokens": 28274595.0, + "step": 12220 + }, + { + "epoch": 0.1121298248831026, + "learning_rate": 0.00017757586870816906, + "loss": 0.9214, + "mean_token_accuracy": 0.7293797373771668, + "num_tokens": 28297840.0, + "step": 12230 + }, + { + "epoch": 0.11222150912258183, + "learning_rate": 0.00017755753186027322, + "loss": 0.8924, + "mean_token_accuracy": 0.7376773357391357, + "num_tokens": 28320452.0, + "step": 12240 + }, + { + "epoch": 0.11231319336206107, + "learning_rate": 0.0001775391950123774, + "loss": 0.8673, + "mean_token_accuracy": 0.7442586421966553, + "num_tokens": 28343099.0, + "step": 12250 + }, + { + "epoch": 0.11240487760154029, + "learning_rate": 0.00017752085816448153, + "loss": 0.8665, + "mean_token_accuracy": 0.7418373227119446, + "num_tokens": 28366627.0, + "step": 12260 + }, + { + "epoch": 0.11249656184101953, + "learning_rate": 0.0001775025213165857, + "loss": 0.8692, + "mean_token_accuracy": 0.7441459059715271, + "num_tokens": 28389832.0, + "step": 12270 + }, + { + "epoch": 0.11258824608049876, + "learning_rate": 0.00017748418446868983, + "loss": 0.9088, + "mean_token_accuracy": 0.7338151514530182, + "num_tokens": 28413462.0, + "step": 12280 + }, + { + "epoch": 0.112679930319978, + "learning_rate": 0.000177465847620794, + "loss": 0.909, + "mean_token_accuracy": 0.7330934405326843, + "num_tokens": 28437242.0, + "step": 12290 + }, + { + "epoch": 0.11277161455945722, + "learning_rate": 0.00017744751077289814, + "loss": 0.9082, + "mean_token_accuracy": 0.7337328672409058, + "num_tokens": 28460968.0, + "step": 12300 + }, + { + "epoch": 0.11286329879893646, + "learning_rate": 0.0001774291739250023, + "loss": 0.8614, + "mean_token_accuracy": 0.7393056094646454, + "num_tokens": 28483382.0, + "step": 12310 + }, + { + "epoch": 0.1129549830384157, + "learning_rate": 0.00017741083707710647, + "loss": 0.8754, + "mean_token_accuracy": 0.7461185574531555, + "num_tokens": 28506229.0, + "step": 12320 + }, + { + "epoch": 0.11304666727789493, + "learning_rate": 0.0001773925002292106, + "loss": 0.9038, + "mean_token_accuracy": 0.7372637808322906, + "num_tokens": 28529589.0, + "step": 12330 + }, + { + "epoch": 0.11313835151737417, + "learning_rate": 0.00017737416338131477, + "loss": 0.8848, + "mean_token_accuracy": 0.7373740017414093, + "num_tokens": 28552097.0, + "step": 12340 + }, + { + "epoch": 0.11323003575685339, + "learning_rate": 0.0001773558265334189, + "loss": 0.8685, + "mean_token_accuracy": 0.7405568540096283, + "num_tokens": 28575170.0, + "step": 12350 + }, + { + "epoch": 0.11332171999633263, + "learning_rate": 0.00017733748968552307, + "loss": 0.8486, + "mean_token_accuracy": 0.744938200712204, + "num_tokens": 28597896.0, + "step": 12360 + }, + { + "epoch": 0.11341340423581187, + "learning_rate": 0.0001773191528376272, + "loss": 0.8618, + "mean_token_accuracy": 0.7475294947624207, + "num_tokens": 28620245.0, + "step": 12370 + }, + { + "epoch": 0.1135050884752911, + "learning_rate": 0.00017730081598973138, + "loss": 0.8944, + "mean_token_accuracy": 0.7386161625385285, + "num_tokens": 28643082.0, + "step": 12380 + }, + { + "epoch": 0.11359677271477032, + "learning_rate": 0.00017728247914183554, + "loss": 0.8798, + "mean_token_accuracy": 0.7405800342559814, + "num_tokens": 28666153.0, + "step": 12390 + }, + { + "epoch": 0.11368845695424956, + "learning_rate": 0.00017726414229393968, + "loss": 0.8729, + "mean_token_accuracy": 0.7414615154266357, + "num_tokens": 28689137.0, + "step": 12400 + }, + { + "epoch": 0.1137801411937288, + "learning_rate": 0.00017724580544604385, + "loss": 0.8648, + "mean_token_accuracy": 0.7416299939155578, + "num_tokens": 28713125.0, + "step": 12410 + }, + { + "epoch": 0.11387182543320803, + "learning_rate": 0.00017722746859814799, + "loss": 0.8854, + "mean_token_accuracy": 0.74670529961586, + "num_tokens": 28736225.0, + "step": 12420 + }, + { + "epoch": 0.11396350967268727, + "learning_rate": 0.00017720913175025212, + "loss": 0.8994, + "mean_token_accuracy": 0.736379188299179, + "num_tokens": 28758825.0, + "step": 12430 + }, + { + "epoch": 0.1140551939121665, + "learning_rate": 0.0001771907949023563, + "loss": 0.8572, + "mean_token_accuracy": 0.742750632762909, + "num_tokens": 28782712.0, + "step": 12440 + }, + { + "epoch": 0.11414687815164573, + "learning_rate": 0.00017717245805446045, + "loss": 0.8845, + "mean_token_accuracy": 0.737398874759674, + "num_tokens": 28805646.0, + "step": 12450 + }, + { + "epoch": 0.11423856239112497, + "learning_rate": 0.0001771541212065646, + "loss": 0.8893, + "mean_token_accuracy": 0.736296546459198, + "num_tokens": 28828809.0, + "step": 12460 + }, + { + "epoch": 0.1143302466306042, + "learning_rate": 0.00017713578435866876, + "loss": 0.8651, + "mean_token_accuracy": 0.743328982591629, + "num_tokens": 28851700.0, + "step": 12470 + }, + { + "epoch": 0.11442193087008343, + "learning_rate": 0.0001771174475107729, + "loss": 0.8658, + "mean_token_accuracy": 0.7449788212776184, + "num_tokens": 28874778.0, + "step": 12480 + }, + { + "epoch": 0.11451361510956266, + "learning_rate": 0.00017709911066287706, + "loss": 0.8932, + "mean_token_accuracy": 0.7372696399688721, + "num_tokens": 28897409.0, + "step": 12490 + }, + { + "epoch": 0.1146052993490419, + "learning_rate": 0.0001770807738149812, + "loss": 0.8597, + "mean_token_accuracy": 0.7413606107234955, + "num_tokens": 28920429.0, + "step": 12500 + }, + { + "epoch": 0.11469698358852114, + "learning_rate": 0.00017706243696708537, + "loss": 0.8942, + "mean_token_accuracy": 0.7346774339675903, + "num_tokens": 28943335.0, + "step": 12510 + }, + { + "epoch": 0.11478866782800037, + "learning_rate": 0.00017704410011918953, + "loss": 0.906, + "mean_token_accuracy": 0.738807737827301, + "num_tokens": 28966256.0, + "step": 12520 + }, + { + "epoch": 0.1148803520674796, + "learning_rate": 0.00017702576327129367, + "loss": 0.9194, + "mean_token_accuracy": 0.7317074060440063, + "num_tokens": 28989502.0, + "step": 12530 + }, + { + "epoch": 0.11497203630695883, + "learning_rate": 0.00017700742642339783, + "loss": 0.9073, + "mean_token_accuracy": 0.7361348927021026, + "num_tokens": 29012615.0, + "step": 12540 + }, + { + "epoch": 0.11506372054643807, + "learning_rate": 0.00017698908957550197, + "loss": 0.899, + "mean_token_accuracy": 0.7338710904121399, + "num_tokens": 29036250.0, + "step": 12550 + }, + { + "epoch": 0.1151554047859173, + "learning_rate": 0.00017697075272760614, + "loss": 0.8771, + "mean_token_accuracy": 0.7368703424930573, + "num_tokens": 29060229.0, + "step": 12560 + }, + { + "epoch": 0.11524708902539653, + "learning_rate": 0.00017695241587971028, + "loss": 0.8591, + "mean_token_accuracy": 0.7381478071212768, + "num_tokens": 29082833.0, + "step": 12570 + }, + { + "epoch": 0.11533877326487577, + "learning_rate": 0.00017693407903181444, + "loss": 0.8957, + "mean_token_accuracy": 0.7396318912506104, + "num_tokens": 29105956.0, + "step": 12580 + }, + { + "epoch": 0.115430457504355, + "learning_rate": 0.0001769157421839186, + "loss": 0.904, + "mean_token_accuracy": 0.7330422759056091, + "num_tokens": 29129058.0, + "step": 12590 + }, + { + "epoch": 0.11552214174383424, + "learning_rate": 0.00017689740533602275, + "loss": 0.8699, + "mean_token_accuracy": 0.7421502351760865, + "num_tokens": 29152454.0, + "step": 12600 + }, + { + "epoch": 0.11561382598331346, + "learning_rate": 0.0001768790684881269, + "loss": 0.8858, + "mean_token_accuracy": 0.7383241057395935, + "num_tokens": 29176404.0, + "step": 12610 + }, + { + "epoch": 0.1157055102227927, + "learning_rate": 0.00017686073164023105, + "loss": 0.8629, + "mean_token_accuracy": 0.7425327897071838, + "num_tokens": 29199327.0, + "step": 12620 + }, + { + "epoch": 0.11579719446227194, + "learning_rate": 0.0001768423947923352, + "loss": 0.8878, + "mean_token_accuracy": 0.7418642282485962, + "num_tokens": 29222644.0, + "step": 12630 + }, + { + "epoch": 0.11588887870175117, + "learning_rate": 0.00017682405794443938, + "loss": 0.8574, + "mean_token_accuracy": 0.7389842867851257, + "num_tokens": 29245584.0, + "step": 12640 + }, + { + "epoch": 0.11598056294123041, + "learning_rate": 0.00017680572109654352, + "loss": 0.8446, + "mean_token_accuracy": 0.7447432279586792, + "num_tokens": 29268366.0, + "step": 12650 + }, + { + "epoch": 0.11607224718070963, + "learning_rate": 0.00017678738424864766, + "loss": 0.8932, + "mean_token_accuracy": 0.731689739227295, + "num_tokens": 29292046.0, + "step": 12660 + }, + { + "epoch": 0.11616393142018887, + "learning_rate": 0.00017676904740075182, + "loss": 0.8623, + "mean_token_accuracy": 0.7423143684864044, + "num_tokens": 29314600.0, + "step": 12670 + }, + { + "epoch": 0.1162556156596681, + "learning_rate": 0.00017675071055285596, + "loss": 0.8952, + "mean_token_accuracy": 0.733033561706543, + "num_tokens": 29338132.0, + "step": 12680 + }, + { + "epoch": 0.11634729989914734, + "learning_rate": 0.00017673237370496013, + "loss": 0.8266, + "mean_token_accuracy": 0.7551371455192566, + "num_tokens": 29362224.0, + "step": 12690 + }, + { + "epoch": 0.11643898413862656, + "learning_rate": 0.00017671403685706426, + "loss": 0.8902, + "mean_token_accuracy": 0.7397430539131165, + "num_tokens": 29384588.0, + "step": 12700 + }, + { + "epoch": 0.1165306683781058, + "learning_rate": 0.00017669570000916843, + "loss": 0.881, + "mean_token_accuracy": 0.7354751825332642, + "num_tokens": 29408007.0, + "step": 12710 + }, + { + "epoch": 0.11662235261758504, + "learning_rate": 0.0001766773631612726, + "loss": 0.8831, + "mean_token_accuracy": 0.741284316778183, + "num_tokens": 29430634.0, + "step": 12720 + }, + { + "epoch": 0.11671403685706427, + "learning_rate": 0.00017665902631337673, + "loss": 0.8712, + "mean_token_accuracy": 0.7477241635322571, + "num_tokens": 29453603.0, + "step": 12730 + }, + { + "epoch": 0.11680572109654351, + "learning_rate": 0.0001766406894654809, + "loss": 0.8891, + "mean_token_accuracy": 0.7399328410625458, + "num_tokens": 29477245.0, + "step": 12740 + }, + { + "epoch": 0.11689740533602273, + "learning_rate": 0.00017662235261758504, + "loss": 0.867, + "mean_token_accuracy": 0.738675570487976, + "num_tokens": 29500502.0, + "step": 12750 + }, + { + "epoch": 0.11698908957550197, + "learning_rate": 0.0001766040157696892, + "loss": 0.8714, + "mean_token_accuracy": 0.745803713798523, + "num_tokens": 29523209.0, + "step": 12760 + }, + { + "epoch": 0.1170807738149812, + "learning_rate": 0.00017658567892179337, + "loss": 0.8471, + "mean_token_accuracy": 0.743337082862854, + "num_tokens": 29545777.0, + "step": 12770 + }, + { + "epoch": 0.11717245805446044, + "learning_rate": 0.0001765673420738975, + "loss": 0.8358, + "mean_token_accuracy": 0.7475039005279541, + "num_tokens": 29569322.0, + "step": 12780 + }, + { + "epoch": 0.11726414229393967, + "learning_rate": 0.00017654900522600167, + "loss": 0.9131, + "mean_token_accuracy": 0.7342238783836365, + "num_tokens": 29592371.0, + "step": 12790 + }, + { + "epoch": 0.1173558265334189, + "learning_rate": 0.0001765306683781058, + "loss": 0.8874, + "mean_token_accuracy": 0.7430296838283539, + "num_tokens": 29615364.0, + "step": 12800 + }, + { + "epoch": 0.11744751077289814, + "learning_rate": 0.00017651233153020998, + "loss": 0.8642, + "mean_token_accuracy": 0.7376182734966278, + "num_tokens": 29638438.0, + "step": 12810 + }, + { + "epoch": 0.11753919501237738, + "learning_rate": 0.00017649399468231411, + "loss": 0.8634, + "mean_token_accuracy": 0.7459731817245483, + "num_tokens": 29661365.0, + "step": 12820 + }, + { + "epoch": 0.11763087925185661, + "learning_rate": 0.00017647565783441825, + "loss": 0.8524, + "mean_token_accuracy": 0.742122745513916, + "num_tokens": 29685258.0, + "step": 12830 + }, + { + "epoch": 0.11772256349133584, + "learning_rate": 0.00017645732098652244, + "loss": 0.8673, + "mean_token_accuracy": 0.7420704424381256, + "num_tokens": 29708804.0, + "step": 12840 + }, + { + "epoch": 0.11781424773081507, + "learning_rate": 0.00017643898413862658, + "loss": 0.8571, + "mean_token_accuracy": 0.745457673072815, + "num_tokens": 29732101.0, + "step": 12850 + }, + { + "epoch": 0.11790593197029431, + "learning_rate": 0.00017642064729073072, + "loss": 0.8712, + "mean_token_accuracy": 0.7470958411693573, + "num_tokens": 29755433.0, + "step": 12860 + }, + { + "epoch": 0.11799761620977355, + "learning_rate": 0.0001764023104428349, + "loss": 0.8634, + "mean_token_accuracy": 0.7413121581077575, + "num_tokens": 29778250.0, + "step": 12870 + }, + { + "epoch": 0.11808930044925277, + "learning_rate": 0.00017638397359493903, + "loss": 0.8634, + "mean_token_accuracy": 0.7354129433631897, + "num_tokens": 29800997.0, + "step": 12880 + }, + { + "epoch": 0.118180984688732, + "learning_rate": 0.0001763656367470432, + "loss": 0.883, + "mean_token_accuracy": 0.7436269700527192, + "num_tokens": 29824078.0, + "step": 12890 + }, + { + "epoch": 0.11827266892821124, + "learning_rate": 0.00017634729989914736, + "loss": 0.8747, + "mean_token_accuracy": 0.7435226678848267, + "num_tokens": 29847400.0, + "step": 12900 + }, + { + "epoch": 0.11836435316769048, + "learning_rate": 0.0001763289630512515, + "loss": 0.8906, + "mean_token_accuracy": 0.7374583840370178, + "num_tokens": 29870619.0, + "step": 12910 + }, + { + "epoch": 0.1184560374071697, + "learning_rate": 0.00017631062620335566, + "loss": 0.8614, + "mean_token_accuracy": 0.7423339128494263, + "num_tokens": 29893367.0, + "step": 12920 + }, + { + "epoch": 0.11854772164664894, + "learning_rate": 0.0001762922893554598, + "loss": 0.8405, + "mean_token_accuracy": 0.7501285612583161, + "num_tokens": 29916432.0, + "step": 12930 + }, + { + "epoch": 0.11863940588612817, + "learning_rate": 0.00017627395250756396, + "loss": 0.8442, + "mean_token_accuracy": 0.7497082769870758, + "num_tokens": 29939826.0, + "step": 12940 + }, + { + "epoch": 0.11873109012560741, + "learning_rate": 0.0001762556156596681, + "loss": 0.8713, + "mean_token_accuracy": 0.7454786598682404, + "num_tokens": 29962629.0, + "step": 12950 + }, + { + "epoch": 0.11882277436508665, + "learning_rate": 0.00017623727881177227, + "loss": 0.904, + "mean_token_accuracy": 0.7302988648414612, + "num_tokens": 29985639.0, + "step": 12960 + }, + { + "epoch": 0.11891445860456587, + "learning_rate": 0.00017621894196387643, + "loss": 0.9112, + "mean_token_accuracy": 0.7313469231128693, + "num_tokens": 30009256.0, + "step": 12970 + }, + { + "epoch": 0.1190061428440451, + "learning_rate": 0.00017620060511598057, + "loss": 0.9059, + "mean_token_accuracy": 0.7313918471336365, + "num_tokens": 30032244.0, + "step": 12980 + }, + { + "epoch": 0.11909782708352434, + "learning_rate": 0.00017618226826808474, + "loss": 0.9034, + "mean_token_accuracy": 0.7358958899974823, + "num_tokens": 30055592.0, + "step": 12990 + }, + { + "epoch": 0.11918951132300358, + "learning_rate": 0.00017616393142018887, + "loss": 0.874, + "mean_token_accuracy": 0.7436038911342621, + "num_tokens": 30078678.0, + "step": 13000 + }, + { + "epoch": 0.1192811955624828, + "learning_rate": 0.00017614559457229304, + "loss": 0.8779, + "mean_token_accuracy": 0.7430507123470307, + "num_tokens": 30101997.0, + "step": 13010 + }, + { + "epoch": 0.11937287980196204, + "learning_rate": 0.00017612725772439718, + "loss": 0.8259, + "mean_token_accuracy": 0.7528484761714935, + "num_tokens": 30124331.0, + "step": 13020 + }, + { + "epoch": 0.11946456404144128, + "learning_rate": 0.00017610892087650134, + "loss": 0.8707, + "mean_token_accuracy": 0.7411357223987579, + "num_tokens": 30147264.0, + "step": 13030 + }, + { + "epoch": 0.11955624828092051, + "learning_rate": 0.0001760905840286055, + "loss": 0.8674, + "mean_token_accuracy": 0.7380927324295044, + "num_tokens": 30170073.0, + "step": 13040 + }, + { + "epoch": 0.11964793252039975, + "learning_rate": 0.00017607224718070965, + "loss": 0.8856, + "mean_token_accuracy": 0.7355506956577301, + "num_tokens": 30192745.0, + "step": 13050 + }, + { + "epoch": 0.11973961675987897, + "learning_rate": 0.00017605391033281379, + "loss": 0.8428, + "mean_token_accuracy": 0.7427493333816528, + "num_tokens": 30215875.0, + "step": 13060 + }, + { + "epoch": 0.11983130099935821, + "learning_rate": 0.00017603557348491795, + "loss": 0.8605, + "mean_token_accuracy": 0.7437385082244873, + "num_tokens": 30239109.0, + "step": 13070 + }, + { + "epoch": 0.11992298523883745, + "learning_rate": 0.0001760172366370221, + "loss": 0.8769, + "mean_token_accuracy": 0.7371023893356323, + "num_tokens": 30262296.0, + "step": 13080 + }, + { + "epoch": 0.12001466947831668, + "learning_rate": 0.00017599889978912626, + "loss": 0.8807, + "mean_token_accuracy": 0.738269716501236, + "num_tokens": 30284904.0, + "step": 13090 + }, + { + "epoch": 0.1201063537177959, + "learning_rate": 0.00017598056294123042, + "loss": 0.8923, + "mean_token_accuracy": 0.7340485513210296, + "num_tokens": 30307147.0, + "step": 13100 + }, + { + "epoch": 0.12019803795727514, + "learning_rate": 0.00017596222609333456, + "loss": 0.9074, + "mean_token_accuracy": 0.7378047645092011, + "num_tokens": 30330172.0, + "step": 13110 + }, + { + "epoch": 0.12028972219675438, + "learning_rate": 0.00017594388924543872, + "loss": 0.8571, + "mean_token_accuracy": 0.7424475669860839, + "num_tokens": 30353920.0, + "step": 13120 + }, + { + "epoch": 0.12038140643623362, + "learning_rate": 0.00017592555239754286, + "loss": 0.8817, + "mean_token_accuracy": 0.7396665096282959, + "num_tokens": 30377352.0, + "step": 13130 + }, + { + "epoch": 0.12047309067571285, + "learning_rate": 0.00017590721554964703, + "loss": 0.8495, + "mean_token_accuracy": 0.7445613801479339, + "num_tokens": 30400876.0, + "step": 13140 + }, + { + "epoch": 0.12056477491519207, + "learning_rate": 0.00017588887870175117, + "loss": 0.8619, + "mean_token_accuracy": 0.7434922993183136, + "num_tokens": 30423565.0, + "step": 13150 + }, + { + "epoch": 0.12065645915467131, + "learning_rate": 0.00017587054185385533, + "loss": 0.8326, + "mean_token_accuracy": 0.7550764858722687, + "num_tokens": 30446652.0, + "step": 13160 + }, + { + "epoch": 0.12074814339415055, + "learning_rate": 0.0001758522050059595, + "loss": 0.8812, + "mean_token_accuracy": 0.7392385125160217, + "num_tokens": 30469711.0, + "step": 13170 + }, + { + "epoch": 0.12083982763362978, + "learning_rate": 0.00017583386815806364, + "loss": 0.8876, + "mean_token_accuracy": 0.7452516674995422, + "num_tokens": 30493225.0, + "step": 13180 + }, + { + "epoch": 0.12093151187310901, + "learning_rate": 0.0001758155313101678, + "loss": 0.8668, + "mean_token_accuracy": 0.7458862066268921, + "num_tokens": 30516034.0, + "step": 13190 + }, + { + "epoch": 0.12102319611258824, + "learning_rate": 0.00017579719446227194, + "loss": 0.8811, + "mean_token_accuracy": 0.7418933987617493, + "num_tokens": 30540341.0, + "step": 13200 + }, + { + "epoch": 0.12111488035206748, + "learning_rate": 0.0001757788576143761, + "loss": 0.889, + "mean_token_accuracy": 0.7409767270088196, + "num_tokens": 30564017.0, + "step": 13210 + }, + { + "epoch": 0.12120656459154672, + "learning_rate": 0.00017576052076648024, + "loss": 0.8902, + "mean_token_accuracy": 0.7385667145252228, + "num_tokens": 30587035.0, + "step": 13220 + }, + { + "epoch": 0.12129824883102594, + "learning_rate": 0.0001757421839185844, + "loss": 0.8678, + "mean_token_accuracy": 0.7395294427871704, + "num_tokens": 30610000.0, + "step": 13230 + }, + { + "epoch": 0.12138993307050518, + "learning_rate": 0.00017572384707068857, + "loss": 0.8596, + "mean_token_accuracy": 0.7460544407367706, + "num_tokens": 30633790.0, + "step": 13240 + }, + { + "epoch": 0.12148161730998441, + "learning_rate": 0.0001757055102227927, + "loss": 0.8696, + "mean_token_accuracy": 0.7419677972793579, + "num_tokens": 30655745.0, + "step": 13250 + }, + { + "epoch": 0.12157330154946365, + "learning_rate": 0.00017568717337489685, + "loss": 0.9234, + "mean_token_accuracy": 0.7229511618614197, + "num_tokens": 30678999.0, + "step": 13260 + }, + { + "epoch": 0.12166498578894289, + "learning_rate": 0.00017566883652700102, + "loss": 0.9156, + "mean_token_accuracy": 0.7283031642436981, + "num_tokens": 30701931.0, + "step": 13270 + }, + { + "epoch": 0.12175667002842211, + "learning_rate": 0.00017565049967910515, + "loss": 0.8696, + "mean_token_accuracy": 0.7463475167751312, + "num_tokens": 30725960.0, + "step": 13280 + }, + { + "epoch": 0.12184835426790135, + "learning_rate": 0.00017563216283120932, + "loss": 0.903, + "mean_token_accuracy": 0.7365835070610046, + "num_tokens": 30749486.0, + "step": 13290 + }, + { + "epoch": 0.12194003850738058, + "learning_rate": 0.00017561382598331348, + "loss": 0.8559, + "mean_token_accuracy": 0.7459181606769562, + "num_tokens": 30772928.0, + "step": 13300 + }, + { + "epoch": 0.12203172274685982, + "learning_rate": 0.00017559548913541762, + "loss": 0.8935, + "mean_token_accuracy": 0.7427541315555573, + "num_tokens": 30795424.0, + "step": 13310 + }, + { + "epoch": 0.12212340698633904, + "learning_rate": 0.0001755771522875218, + "loss": 0.8668, + "mean_token_accuracy": 0.7493497610092164, + "num_tokens": 30817827.0, + "step": 13320 + }, + { + "epoch": 0.12221509122581828, + "learning_rate": 0.00017555881543962593, + "loss": 0.9287, + "mean_token_accuracy": 0.7289869010448455, + "num_tokens": 30840847.0, + "step": 13330 + }, + { + "epoch": 0.12230677546529752, + "learning_rate": 0.0001755404785917301, + "loss": 0.8713, + "mean_token_accuracy": 0.7393110394477844, + "num_tokens": 30863622.0, + "step": 13340 + }, + { + "epoch": 0.12239845970477675, + "learning_rate": 0.00017552214174383423, + "loss": 0.8588, + "mean_token_accuracy": 0.7428774952888488, + "num_tokens": 30886248.0, + "step": 13350 + }, + { + "epoch": 0.12249014394425599, + "learning_rate": 0.0001755038048959384, + "loss": 0.9237, + "mean_token_accuracy": 0.7274897336959839, + "num_tokens": 30910208.0, + "step": 13360 + }, + { + "epoch": 0.12258182818373521, + "learning_rate": 0.00017548546804804256, + "loss": 0.8977, + "mean_token_accuracy": 0.7355661809444427, + "num_tokens": 30932555.0, + "step": 13370 + }, + { + "epoch": 0.12267351242321445, + "learning_rate": 0.0001754671312001467, + "loss": 0.8762, + "mean_token_accuracy": 0.741988730430603, + "num_tokens": 30955296.0, + "step": 13380 + }, + { + "epoch": 0.12276519666269368, + "learning_rate": 0.00017544879435225087, + "loss": 0.844, + "mean_token_accuracy": 0.7488784313201904, + "num_tokens": 30977767.0, + "step": 13390 + }, + { + "epoch": 0.12285688090217292, + "learning_rate": 0.000175430457504355, + "loss": 0.8796, + "mean_token_accuracy": 0.7436460018157959, + "num_tokens": 31001079.0, + "step": 13400 + }, + { + "epoch": 0.12294856514165214, + "learning_rate": 0.00017541212065645917, + "loss": 0.8936, + "mean_token_accuracy": 0.7348134934902191, + "num_tokens": 31023951.0, + "step": 13410 + }, + { + "epoch": 0.12304024938113138, + "learning_rate": 0.0001753937838085633, + "loss": 0.8382, + "mean_token_accuracy": 0.7484686076641083, + "num_tokens": 31046813.0, + "step": 13420 + }, + { + "epoch": 0.12313193362061062, + "learning_rate": 0.00017537544696066747, + "loss": 0.8896, + "mean_token_accuracy": 0.7325926005840302, + "num_tokens": 31069636.0, + "step": 13430 + }, + { + "epoch": 0.12322361786008985, + "learning_rate": 0.00017535711011277164, + "loss": 0.8812, + "mean_token_accuracy": 0.7350605428218842, + "num_tokens": 31092806.0, + "step": 13440 + }, + { + "epoch": 0.12331530209956909, + "learning_rate": 0.00017533877326487578, + "loss": 0.8582, + "mean_token_accuracy": 0.7459491133689881, + "num_tokens": 31115851.0, + "step": 13450 + }, + { + "epoch": 0.12340698633904831, + "learning_rate": 0.00017532043641697991, + "loss": 0.8861, + "mean_token_accuracy": 0.7331504344940185, + "num_tokens": 31138514.0, + "step": 13460 + }, + { + "epoch": 0.12349867057852755, + "learning_rate": 0.00017530209956908408, + "loss": 0.8733, + "mean_token_accuracy": 0.7477503836154937, + "num_tokens": 31161440.0, + "step": 13470 + }, + { + "epoch": 0.12359035481800679, + "learning_rate": 0.00017528376272118822, + "loss": 0.8845, + "mean_token_accuracy": 0.732633912563324, + "num_tokens": 31184423.0, + "step": 13480 + }, + { + "epoch": 0.12368203905748602, + "learning_rate": 0.0001752654258732924, + "loss": 0.8959, + "mean_token_accuracy": 0.7294002056121827, + "num_tokens": 31207404.0, + "step": 13490 + }, + { + "epoch": 0.12377372329696525, + "learning_rate": 0.00017524708902539655, + "loss": 0.8831, + "mean_token_accuracy": 0.7389393508434295, + "num_tokens": 31230643.0, + "step": 13500 + }, + { + "epoch": 0.12386540753644448, + "learning_rate": 0.0001752287521775007, + "loss": 0.8585, + "mean_token_accuracy": 0.7482302010059356, + "num_tokens": 31254253.0, + "step": 13510 + }, + { + "epoch": 0.12395709177592372, + "learning_rate": 0.00017521041532960485, + "loss": 0.912, + "mean_token_accuracy": 0.7345802307128906, + "num_tokens": 31276987.0, + "step": 13520 + }, + { + "epoch": 0.12404877601540296, + "learning_rate": 0.000175192078481709, + "loss": 0.8782, + "mean_token_accuracy": 0.7386352062225342, + "num_tokens": 31300638.0, + "step": 13530 + }, + { + "epoch": 0.12414046025488218, + "learning_rate": 0.00017517374163381316, + "loss": 0.8629, + "mean_token_accuracy": 0.7417355597019195, + "num_tokens": 31324326.0, + "step": 13540 + }, + { + "epoch": 0.12423214449436142, + "learning_rate": 0.0001751554047859173, + "loss": 0.871, + "mean_token_accuracy": 0.7393722474575043, + "num_tokens": 31348317.0, + "step": 13550 + }, + { + "epoch": 0.12432382873384065, + "learning_rate": 0.00017513706793802146, + "loss": 0.9122, + "mean_token_accuracy": 0.7346632480621338, + "num_tokens": 31371033.0, + "step": 13560 + }, + { + "epoch": 0.12441551297331989, + "learning_rate": 0.00017511873109012563, + "loss": 0.8524, + "mean_token_accuracy": 0.7437283635139466, + "num_tokens": 31394548.0, + "step": 13570 + }, + { + "epoch": 0.12450719721279913, + "learning_rate": 0.00017510039424222976, + "loss": 0.8577, + "mean_token_accuracy": 0.7488535881042481, + "num_tokens": 31417408.0, + "step": 13580 + }, + { + "epoch": 0.12459888145227835, + "learning_rate": 0.00017508205739433393, + "loss": 0.8886, + "mean_token_accuracy": 0.7315831184387207, + "num_tokens": 31439844.0, + "step": 13590 + }, + { + "epoch": 0.12469056569175758, + "learning_rate": 0.00017506372054643807, + "loss": 0.8789, + "mean_token_accuracy": 0.7398853242397309, + "num_tokens": 31464053.0, + "step": 13600 + }, + { + "epoch": 0.12478224993123682, + "learning_rate": 0.00017504538369854223, + "loss": 0.9049, + "mean_token_accuracy": 0.7342214941978454, + "num_tokens": 31487565.0, + "step": 13610 + }, + { + "epoch": 0.12487393417071606, + "learning_rate": 0.0001750270468506464, + "loss": 0.8835, + "mean_token_accuracy": 0.7285666584968566, + "num_tokens": 31511006.0, + "step": 13620 + }, + { + "epoch": 0.12496561841019528, + "learning_rate": 0.00017500871000275054, + "loss": 0.882, + "mean_token_accuracy": 0.7379772901535034, + "num_tokens": 31534480.0, + "step": 13630 + }, + { + "epoch": 0.12505730264967452, + "learning_rate": 0.0001749903731548547, + "loss": 0.8741, + "mean_token_accuracy": 0.7383758902549744, + "num_tokens": 31557449.0, + "step": 13640 + }, + { + "epoch": 0.12514898688915377, + "learning_rate": 0.00017497203630695884, + "loss": 0.8883, + "mean_token_accuracy": 0.7329118847846985, + "num_tokens": 31581519.0, + "step": 13650 + }, + { + "epoch": 0.125240671128633, + "learning_rate": 0.00017495369945906298, + "loss": 0.8653, + "mean_token_accuracy": 0.7431224584579468, + "num_tokens": 31603877.0, + "step": 13660 + }, + { + "epoch": 0.1253323553681122, + "learning_rate": 0.00017493536261116714, + "loss": 0.8817, + "mean_token_accuracy": 0.7401574850082397, + "num_tokens": 31627032.0, + "step": 13670 + }, + { + "epoch": 0.12542403960759146, + "learning_rate": 0.00017491702576327128, + "loss": 0.8452, + "mean_token_accuracy": 0.7415537536144257, + "num_tokens": 31650209.0, + "step": 13680 + }, + { + "epoch": 0.1255157238470707, + "learning_rate": 0.00017489868891537548, + "loss": 0.8795, + "mean_token_accuracy": 0.7378593504428863, + "num_tokens": 31673550.0, + "step": 13690 + }, + { + "epoch": 0.1256074080865499, + "learning_rate": 0.00017488035206747961, + "loss": 0.8472, + "mean_token_accuracy": 0.7466789901256561, + "num_tokens": 31696646.0, + "step": 13700 + }, + { + "epoch": 0.12569909232602916, + "learning_rate": 0.00017486201521958375, + "loss": 0.8369, + "mean_token_accuracy": 0.7511944532394409, + "num_tokens": 31719187.0, + "step": 13710 + }, + { + "epoch": 0.12579077656550838, + "learning_rate": 0.00017484367837168792, + "loss": 0.881, + "mean_token_accuracy": 0.7432884573936462, + "num_tokens": 31742580.0, + "step": 13720 + }, + { + "epoch": 0.12588246080498763, + "learning_rate": 0.00017482534152379206, + "loss": 0.8598, + "mean_token_accuracy": 0.7441620707511902, + "num_tokens": 31765975.0, + "step": 13730 + }, + { + "epoch": 0.12597414504446686, + "learning_rate": 0.00017480700467589622, + "loss": 0.9079, + "mean_token_accuracy": 0.7359534800052643, + "num_tokens": 31789434.0, + "step": 13740 + }, + { + "epoch": 0.12606582928394608, + "learning_rate": 0.0001747886678280004, + "loss": 0.8799, + "mean_token_accuracy": 0.7369920551776886, + "num_tokens": 31812985.0, + "step": 13750 + }, + { + "epoch": 0.12615751352342533, + "learning_rate": 0.00017477033098010453, + "loss": 0.8825, + "mean_token_accuracy": 0.7377887725830078, + "num_tokens": 31835774.0, + "step": 13760 + }, + { + "epoch": 0.12624919776290455, + "learning_rate": 0.0001747519941322087, + "loss": 0.8391, + "mean_token_accuracy": 0.7521439611911773, + "num_tokens": 31859100.0, + "step": 13770 + }, + { + "epoch": 0.1263408820023838, + "learning_rate": 0.00017473365728431283, + "loss": 0.874, + "mean_token_accuracy": 0.7330224096775055, + "num_tokens": 31882262.0, + "step": 13780 + }, + { + "epoch": 0.12643256624186303, + "learning_rate": 0.000174715320436417, + "loss": 0.9049, + "mean_token_accuracy": 0.734117305278778, + "num_tokens": 31905080.0, + "step": 13790 + }, + { + "epoch": 0.12652425048134225, + "learning_rate": 0.00017469698358852113, + "loss": 0.8465, + "mean_token_accuracy": 0.744682377576828, + "num_tokens": 31927947.0, + "step": 13800 + }, + { + "epoch": 0.1266159347208215, + "learning_rate": 0.0001746786467406253, + "loss": 0.8979, + "mean_token_accuracy": 0.7385300934314728, + "num_tokens": 31950836.0, + "step": 13810 + }, + { + "epoch": 0.12670761896030072, + "learning_rate": 0.00017466030989272946, + "loss": 0.8692, + "mean_token_accuracy": 0.7386554837226867, + "num_tokens": 31973742.0, + "step": 13820 + }, + { + "epoch": 0.12679930319977994, + "learning_rate": 0.0001746419730448336, + "loss": 0.8467, + "mean_token_accuracy": 0.7460804641246795, + "num_tokens": 31996494.0, + "step": 13830 + }, + { + "epoch": 0.1268909874392592, + "learning_rate": 0.00017462363619693777, + "loss": 0.9014, + "mean_token_accuracy": 0.7330855011940003, + "num_tokens": 32019415.0, + "step": 13840 + }, + { + "epoch": 0.12698267167873842, + "learning_rate": 0.0001746052993490419, + "loss": 0.8693, + "mean_token_accuracy": 0.7430007636547089, + "num_tokens": 32043083.0, + "step": 13850 + }, + { + "epoch": 0.12707435591821767, + "learning_rate": 0.00017458696250114604, + "loss": 0.8624, + "mean_token_accuracy": 0.7419776797294617, + "num_tokens": 32065552.0, + "step": 13860 + }, + { + "epoch": 0.1271660401576969, + "learning_rate": 0.0001745686256532502, + "loss": 0.937, + "mean_token_accuracy": 0.7287083685398101, + "num_tokens": 32088367.0, + "step": 13870 + }, + { + "epoch": 0.12725772439717611, + "learning_rate": 0.00017455028880535437, + "loss": 0.925, + "mean_token_accuracy": 0.7303915798664093, + "num_tokens": 32110728.0, + "step": 13880 + }, + { + "epoch": 0.12734940863665536, + "learning_rate": 0.00017453195195745854, + "loss": 0.8545, + "mean_token_accuracy": 0.7415268540382385, + "num_tokens": 32134295.0, + "step": 13890 + }, + { + "epoch": 0.1274410928761346, + "learning_rate": 0.00017451361510956268, + "loss": 0.8718, + "mean_token_accuracy": 0.7446969985961914, + "num_tokens": 32156688.0, + "step": 13900 + }, + { + "epoch": 0.12753277711561384, + "learning_rate": 0.00017449527826166682, + "loss": 0.8958, + "mean_token_accuracy": 0.7414741516113281, + "num_tokens": 32179971.0, + "step": 13910 + }, + { + "epoch": 0.12762446135509306, + "learning_rate": 0.00017447694141377098, + "loss": 0.8449, + "mean_token_accuracy": 0.7451531112194061, + "num_tokens": 32202781.0, + "step": 13920 + }, + { + "epoch": 0.12771614559457228, + "learning_rate": 0.00017445860456587512, + "loss": 0.8658, + "mean_token_accuracy": 0.7495111107826233, + "num_tokens": 32225524.0, + "step": 13930 + }, + { + "epoch": 0.12780782983405153, + "learning_rate": 0.00017444026771797929, + "loss": 0.8796, + "mean_token_accuracy": 0.7446104109287262, + "num_tokens": 32248427.0, + "step": 13940 + }, + { + "epoch": 0.12789951407353076, + "learning_rate": 0.00017442193087008345, + "loss": 0.9104, + "mean_token_accuracy": 0.7278967261314392, + "num_tokens": 32271092.0, + "step": 13950 + }, + { + "epoch": 0.12799119831301, + "learning_rate": 0.0001744035940221876, + "loss": 0.9051, + "mean_token_accuracy": 0.7343689262866974, + "num_tokens": 32294127.0, + "step": 13960 + }, + { + "epoch": 0.12808288255248923, + "learning_rate": 0.00017438525717429175, + "loss": 0.8598, + "mean_token_accuracy": 0.7487718880176544, + "num_tokens": 32316594.0, + "step": 13970 + }, + { + "epoch": 0.12817456679196845, + "learning_rate": 0.0001743669203263959, + "loss": 0.9167, + "mean_token_accuracy": 0.7296574294567109, + "num_tokens": 32340409.0, + "step": 13980 + }, + { + "epoch": 0.1282662510314477, + "learning_rate": 0.00017434858347850006, + "loss": 0.8711, + "mean_token_accuracy": 0.743960189819336, + "num_tokens": 32363980.0, + "step": 13990 + }, + { + "epoch": 0.12835793527092693, + "learning_rate": 0.0001743302466306042, + "loss": 0.9075, + "mean_token_accuracy": 0.7316538751125335, + "num_tokens": 32386796.0, + "step": 14000 + }, + { + "epoch": 0.12844961951040615, + "learning_rate": 0.00017431190978270836, + "loss": 0.852, + "mean_token_accuracy": 0.7484723925590515, + "num_tokens": 32410086.0, + "step": 14010 + }, + { + "epoch": 0.1285413037498854, + "learning_rate": 0.00017429357293481253, + "loss": 0.8397, + "mean_token_accuracy": 0.7521367490291595, + "num_tokens": 32432378.0, + "step": 14020 + }, + { + "epoch": 0.12863298798936462, + "learning_rate": 0.00017427523608691667, + "loss": 0.9017, + "mean_token_accuracy": 0.7342784345149994, + "num_tokens": 32454976.0, + "step": 14030 + }, + { + "epoch": 0.12872467222884387, + "learning_rate": 0.00017425689923902083, + "loss": 0.8686, + "mean_token_accuracy": 0.7416263163089752, + "num_tokens": 32477821.0, + "step": 14040 + }, + { + "epoch": 0.1288163564683231, + "learning_rate": 0.00017423856239112497, + "loss": 0.893, + "mean_token_accuracy": 0.7359785735607147, + "num_tokens": 32501400.0, + "step": 14050 + }, + { + "epoch": 0.12890804070780232, + "learning_rate": 0.0001742202255432291, + "loss": 0.8906, + "mean_token_accuracy": 0.7366522014141083, + "num_tokens": 32524581.0, + "step": 14060 + }, + { + "epoch": 0.12899972494728157, + "learning_rate": 0.00017420188869533327, + "loss": 0.8726, + "mean_token_accuracy": 0.7413610994815827, + "num_tokens": 32546892.0, + "step": 14070 + }, + { + "epoch": 0.1290914091867608, + "learning_rate": 0.00017418355184743744, + "loss": 0.8903, + "mean_token_accuracy": 0.7370317041873932, + "num_tokens": 32570582.0, + "step": 14080 + }, + { + "epoch": 0.12918309342624004, + "learning_rate": 0.0001741652149995416, + "loss": 0.8827, + "mean_token_accuracy": 0.7373828768730164, + "num_tokens": 32594207.0, + "step": 14090 + }, + { + "epoch": 0.12927477766571926, + "learning_rate": 0.00017414687815164574, + "loss": 0.8813, + "mean_token_accuracy": 0.7411800384521484, + "num_tokens": 32617335.0, + "step": 14100 + }, + { + "epoch": 0.1293664619051985, + "learning_rate": 0.00017412854130374988, + "loss": 0.8307, + "mean_token_accuracy": 0.7452889561653138, + "num_tokens": 32640265.0, + "step": 14110 + }, + { + "epoch": 0.12945814614467774, + "learning_rate": 0.00017411020445585405, + "loss": 0.8614, + "mean_token_accuracy": 0.7437470495700836, + "num_tokens": 32664621.0, + "step": 14120 + }, + { + "epoch": 0.12954983038415696, + "learning_rate": 0.00017409186760795818, + "loss": 0.8763, + "mean_token_accuracy": 0.7378992319107056, + "num_tokens": 32688438.0, + "step": 14130 + }, + { + "epoch": 0.12964151462363618, + "learning_rate": 0.00017407353076006238, + "loss": 0.8625, + "mean_token_accuracy": 0.7478434562683105, + "num_tokens": 32711422.0, + "step": 14140 + }, + { + "epoch": 0.12973319886311543, + "learning_rate": 0.00017405519391216652, + "loss": 0.8866, + "mean_token_accuracy": 0.7385292470455169, + "num_tokens": 32734443.0, + "step": 14150 + }, + { + "epoch": 0.12982488310259466, + "learning_rate": 0.00017403685706427065, + "loss": 0.8914, + "mean_token_accuracy": 0.7368983030319214, + "num_tokens": 32757880.0, + "step": 14160 + }, + { + "epoch": 0.1299165673420739, + "learning_rate": 0.00017401852021637482, + "loss": 0.8566, + "mean_token_accuracy": 0.7447448313236237, + "num_tokens": 32781375.0, + "step": 14170 + }, + { + "epoch": 0.13000825158155313, + "learning_rate": 0.00017400018336847896, + "loss": 0.8912, + "mean_token_accuracy": 0.7378781378269196, + "num_tokens": 32804014.0, + "step": 14180 + }, + { + "epoch": 0.13009993582103235, + "learning_rate": 0.00017398184652058312, + "loss": 0.8675, + "mean_token_accuracy": 0.744933158159256, + "num_tokens": 32827445.0, + "step": 14190 + }, + { + "epoch": 0.1301916200605116, + "learning_rate": 0.00017396350967268726, + "loss": 0.883, + "mean_token_accuracy": 0.7406885266304016, + "num_tokens": 32850833.0, + "step": 14200 + }, + { + "epoch": 0.13028330429999083, + "learning_rate": 0.00017394517282479143, + "loss": 0.8786, + "mean_token_accuracy": 0.7334289312362671, + "num_tokens": 32874270.0, + "step": 14210 + }, + { + "epoch": 0.13037498853947008, + "learning_rate": 0.0001739268359768956, + "loss": 0.87, + "mean_token_accuracy": 0.7492436230182647, + "num_tokens": 32897659.0, + "step": 14220 + }, + { + "epoch": 0.1304666727789493, + "learning_rate": 0.00017390849912899973, + "loss": 0.8896, + "mean_token_accuracy": 0.7279127836227417, + "num_tokens": 32920966.0, + "step": 14230 + }, + { + "epoch": 0.13055835701842852, + "learning_rate": 0.0001738901622811039, + "loss": 0.8707, + "mean_token_accuracy": 0.7412879467010498, + "num_tokens": 32942964.0, + "step": 14240 + }, + { + "epoch": 0.13065004125790777, + "learning_rate": 0.00017387182543320803, + "loss": 0.8905, + "mean_token_accuracy": 0.7424752235412597, + "num_tokens": 32966348.0, + "step": 14250 + }, + { + "epoch": 0.130741725497387, + "learning_rate": 0.00017385348858531217, + "loss": 0.8767, + "mean_token_accuracy": 0.7338845789432525, + "num_tokens": 32989647.0, + "step": 14260 + }, + { + "epoch": 0.13083340973686625, + "learning_rate": 0.00017383515173741637, + "loss": 0.9067, + "mean_token_accuracy": 0.7268571972846984, + "num_tokens": 33012854.0, + "step": 14270 + }, + { + "epoch": 0.13092509397634547, + "learning_rate": 0.0001738168148895205, + "loss": 0.8825, + "mean_token_accuracy": 0.7357637226581574, + "num_tokens": 33035560.0, + "step": 14280 + }, + { + "epoch": 0.1310167782158247, + "learning_rate": 0.00017379847804162467, + "loss": 0.8935, + "mean_token_accuracy": 0.739679080247879, + "num_tokens": 33058348.0, + "step": 14290 + }, + { + "epoch": 0.13110846245530394, + "learning_rate": 0.0001737801411937288, + "loss": 0.8915, + "mean_token_accuracy": 0.7366253197193146, + "num_tokens": 33081400.0, + "step": 14300 + }, + { + "epoch": 0.13120014669478317, + "learning_rate": 0.00017376180434583295, + "loss": 0.8934, + "mean_token_accuracy": 0.7382798731327057, + "num_tokens": 33104888.0, + "step": 14310 + }, + { + "epoch": 0.1312918309342624, + "learning_rate": 0.0001737434674979371, + "loss": 0.8634, + "mean_token_accuracy": 0.7401932656764985, + "num_tokens": 33128450.0, + "step": 14320 + }, + { + "epoch": 0.13138351517374164, + "learning_rate": 0.00017372513065004125, + "loss": 0.8823, + "mean_token_accuracy": 0.735636180639267, + "num_tokens": 33151650.0, + "step": 14330 + }, + { + "epoch": 0.13147519941322086, + "learning_rate": 0.00017370679380214544, + "loss": 0.8608, + "mean_token_accuracy": 0.7445764899253845, + "num_tokens": 33174893.0, + "step": 14340 + }, + { + "epoch": 0.1315668836527001, + "learning_rate": 0.00017368845695424958, + "loss": 0.9213, + "mean_token_accuracy": 0.7347506880760193, + "num_tokens": 33197781.0, + "step": 14350 + }, + { + "epoch": 0.13165856789217933, + "learning_rate": 0.00017367012010635372, + "loss": 0.8805, + "mean_token_accuracy": 0.7362947225570678, + "num_tokens": 33221135.0, + "step": 14360 + }, + { + "epoch": 0.13175025213165856, + "learning_rate": 0.00017365178325845788, + "loss": 0.8875, + "mean_token_accuracy": 0.7380826473236084, + "num_tokens": 33244067.0, + "step": 14370 + }, + { + "epoch": 0.1318419363711378, + "learning_rate": 0.00017363344641056202, + "loss": 0.8375, + "mean_token_accuracy": 0.7559607982635498, + "num_tokens": 33266712.0, + "step": 14380 + }, + { + "epoch": 0.13193362061061703, + "learning_rate": 0.0001736151095626662, + "loss": 0.9012, + "mean_token_accuracy": 0.7327978372573852, + "num_tokens": 33289080.0, + "step": 14390 + }, + { + "epoch": 0.13202530485009628, + "learning_rate": 0.00017359677271477033, + "loss": 0.8526, + "mean_token_accuracy": 0.7474592685699463, + "num_tokens": 33312643.0, + "step": 14400 + }, + { + "epoch": 0.1321169890895755, + "learning_rate": 0.0001735784358668745, + "loss": 0.8799, + "mean_token_accuracy": 0.7366613864898681, + "num_tokens": 33335828.0, + "step": 14410 + }, + { + "epoch": 0.13220867332905473, + "learning_rate": 0.00017356009901897866, + "loss": 0.8346, + "mean_token_accuracy": 0.7410920321941376, + "num_tokens": 33358712.0, + "step": 14420 + }, + { + "epoch": 0.13230035756853398, + "learning_rate": 0.0001735417621710828, + "loss": 0.9087, + "mean_token_accuracy": 0.7315150141716004, + "num_tokens": 33381941.0, + "step": 14430 + }, + { + "epoch": 0.1323920418080132, + "learning_rate": 0.00017352342532318696, + "loss": 0.8513, + "mean_token_accuracy": 0.746486222743988, + "num_tokens": 33404783.0, + "step": 14440 + }, + { + "epoch": 0.13248372604749242, + "learning_rate": 0.0001735050884752911, + "loss": 0.8657, + "mean_token_accuracy": 0.7400833129882812, + "num_tokens": 33428194.0, + "step": 14450 + }, + { + "epoch": 0.13257541028697167, + "learning_rate": 0.00017348675162739524, + "loss": 0.8727, + "mean_token_accuracy": 0.7396412909030914, + "num_tokens": 33451989.0, + "step": 14460 + }, + { + "epoch": 0.1326670945264509, + "learning_rate": 0.00017346841477949943, + "loss": 0.8861, + "mean_token_accuracy": 0.7379320859909058, + "num_tokens": 33475313.0, + "step": 14470 + }, + { + "epoch": 0.13275877876593015, + "learning_rate": 0.00017345007793160357, + "loss": 0.8577, + "mean_token_accuracy": 0.748997038602829, + "num_tokens": 33498554.0, + "step": 14480 + }, + { + "epoch": 0.13285046300540937, + "learning_rate": 0.00017343174108370773, + "loss": 0.8784, + "mean_token_accuracy": 0.7325134396553039, + "num_tokens": 33522514.0, + "step": 14490 + }, + { + "epoch": 0.1329421472448886, + "learning_rate": 0.00017341340423581187, + "loss": 0.8732, + "mean_token_accuracy": 0.7366645336151123, + "num_tokens": 33546435.0, + "step": 14500 + }, + { + "epoch": 0.13303383148436784, + "learning_rate": 0.000173395067387916, + "loss": 0.8552, + "mean_token_accuracy": 0.7399717330932617, + "num_tokens": 33568916.0, + "step": 14510 + }, + { + "epoch": 0.13312551572384707, + "learning_rate": 0.00017337673054002018, + "loss": 0.8993, + "mean_token_accuracy": 0.7399784088134765, + "num_tokens": 33591657.0, + "step": 14520 + }, + { + "epoch": 0.13321719996332632, + "learning_rate": 0.00017335839369212431, + "loss": 0.9011, + "mean_token_accuracy": 0.7350584924221039, + "num_tokens": 33614933.0, + "step": 14530 + }, + { + "epoch": 0.13330888420280554, + "learning_rate": 0.0001733400568442285, + "loss": 0.8839, + "mean_token_accuracy": 0.7400415539741516, + "num_tokens": 33638132.0, + "step": 14540 + }, + { + "epoch": 0.13340056844228476, + "learning_rate": 0.00017332171999633264, + "loss": 0.8462, + "mean_token_accuracy": 0.744160383939743, + "num_tokens": 33661575.0, + "step": 14550 + }, + { + "epoch": 0.133492252681764, + "learning_rate": 0.00017330338314843678, + "loss": 0.8713, + "mean_token_accuracy": 0.7381963133811951, + "num_tokens": 33684064.0, + "step": 14560 + }, + { + "epoch": 0.13358393692124323, + "learning_rate": 0.00017328504630054095, + "loss": 0.8592, + "mean_token_accuracy": 0.744098824262619, + "num_tokens": 33706846.0, + "step": 14570 + }, + { + "epoch": 0.13367562116072249, + "learning_rate": 0.0001732667094526451, + "loss": 0.8711, + "mean_token_accuracy": 0.7483438372611999, + "num_tokens": 33730542.0, + "step": 14580 + }, + { + "epoch": 0.1337673054002017, + "learning_rate": 0.00017324837260474925, + "loss": 0.8548, + "mean_token_accuracy": 0.7378258168697357, + "num_tokens": 33753327.0, + "step": 14590 + }, + { + "epoch": 0.13385898963968093, + "learning_rate": 0.00017323003575685342, + "loss": 0.8784, + "mean_token_accuracy": 0.737323272228241, + "num_tokens": 33775698.0, + "step": 14600 + }, + { + "epoch": 0.13395067387916018, + "learning_rate": 0.00017321169890895756, + "loss": 0.8636, + "mean_token_accuracy": 0.7428741157054901, + "num_tokens": 33798575.0, + "step": 14610 + }, + { + "epoch": 0.1340423581186394, + "learning_rate": 0.00017319336206106172, + "loss": 0.8901, + "mean_token_accuracy": 0.7395589411258697, + "num_tokens": 33821900.0, + "step": 14620 + }, + { + "epoch": 0.13413404235811863, + "learning_rate": 0.00017317502521316586, + "loss": 0.9027, + "mean_token_accuracy": 0.7431897580623626, + "num_tokens": 33844451.0, + "step": 14630 + }, + { + "epoch": 0.13422572659759788, + "learning_rate": 0.00017315668836527002, + "loss": 0.8767, + "mean_token_accuracy": 0.7426425874233246, + "num_tokens": 33867120.0, + "step": 14640 + }, + { + "epoch": 0.1343174108370771, + "learning_rate": 0.00017313835151737416, + "loss": 0.8865, + "mean_token_accuracy": 0.7388552486896515, + "num_tokens": 33891226.0, + "step": 14650 + }, + { + "epoch": 0.13440909507655635, + "learning_rate": 0.0001731200146694783, + "loss": 0.8871, + "mean_token_accuracy": 0.7396299719810486, + "num_tokens": 33914381.0, + "step": 14660 + }, + { + "epoch": 0.13450077931603557, + "learning_rate": 0.0001731016778215825, + "loss": 0.9021, + "mean_token_accuracy": 0.7366632640361785, + "num_tokens": 33937847.0, + "step": 14670 + }, + { + "epoch": 0.1345924635555148, + "learning_rate": 0.00017308334097368663, + "loss": 0.864, + "mean_token_accuracy": 0.7463048279285431, + "num_tokens": 33961142.0, + "step": 14680 + }, + { + "epoch": 0.13468414779499405, + "learning_rate": 0.0001730650041257908, + "loss": 0.9041, + "mean_token_accuracy": 0.7357403934001923, + "num_tokens": 33983978.0, + "step": 14690 + }, + { + "epoch": 0.13477583203447327, + "learning_rate": 0.00017304666727789494, + "loss": 0.8969, + "mean_token_accuracy": 0.7384519755840302, + "num_tokens": 34006363.0, + "step": 14700 + }, + { + "epoch": 0.13486751627395252, + "learning_rate": 0.00017302833042999907, + "loss": 0.8922, + "mean_token_accuracy": 0.7325655400753022, + "num_tokens": 34029506.0, + "step": 14710 + }, + { + "epoch": 0.13495920051343174, + "learning_rate": 0.00017300999358210324, + "loss": 0.8747, + "mean_token_accuracy": 0.7357029318809509, + "num_tokens": 34052710.0, + "step": 14720 + }, + { + "epoch": 0.13505088475291097, + "learning_rate": 0.0001729916567342074, + "loss": 0.9007, + "mean_token_accuracy": 0.7338222444057465, + "num_tokens": 34076247.0, + "step": 14730 + }, + { + "epoch": 0.13514256899239022, + "learning_rate": 0.00017297331988631157, + "loss": 0.8823, + "mean_token_accuracy": 0.7370768666267395, + "num_tokens": 34098953.0, + "step": 14740 + }, + { + "epoch": 0.13523425323186944, + "learning_rate": 0.0001729549830384157, + "loss": 0.9181, + "mean_token_accuracy": 0.7265935063362121, + "num_tokens": 34122802.0, + "step": 14750 + }, + { + "epoch": 0.13532593747134866, + "learning_rate": 0.00017293664619051985, + "loss": 0.8771, + "mean_token_accuracy": 0.7369015514850616, + "num_tokens": 34145898.0, + "step": 14760 + }, + { + "epoch": 0.1354176217108279, + "learning_rate": 0.000172918309342624, + "loss": 0.8535, + "mean_token_accuracy": 0.7423493146896363, + "num_tokens": 34169195.0, + "step": 14770 + }, + { + "epoch": 0.13550930595030714, + "learning_rate": 0.00017289997249472815, + "loss": 0.8726, + "mean_token_accuracy": 0.7451719880104065, + "num_tokens": 34192593.0, + "step": 14780 + }, + { + "epoch": 0.13560099018978639, + "learning_rate": 0.00017288163564683232, + "loss": 0.8826, + "mean_token_accuracy": 0.7411118149757385, + "num_tokens": 34215861.0, + "step": 14790 + }, + { + "epoch": 0.1356926744292656, + "learning_rate": 0.00017286329879893648, + "loss": 0.8551, + "mean_token_accuracy": 0.7451322019100189, + "num_tokens": 34238554.0, + "step": 14800 + }, + { + "epoch": 0.13578435866874483, + "learning_rate": 0.00017284496195104062, + "loss": 0.8379, + "mean_token_accuracy": 0.738130247592926, + "num_tokens": 34262443.0, + "step": 14810 + }, + { + "epoch": 0.13587604290822408, + "learning_rate": 0.00017282662510314479, + "loss": 0.9108, + "mean_token_accuracy": 0.7346627950668335, + "num_tokens": 34285167.0, + "step": 14820 + }, + { + "epoch": 0.1359677271477033, + "learning_rate": 0.00017280828825524892, + "loss": 0.8718, + "mean_token_accuracy": 0.7400343775749206, + "num_tokens": 34308781.0, + "step": 14830 + }, + { + "epoch": 0.13605941138718256, + "learning_rate": 0.0001727899514073531, + "loss": 0.8805, + "mean_token_accuracy": 0.7371185064315796, + "num_tokens": 34332493.0, + "step": 14840 + }, + { + "epoch": 0.13615109562666178, + "learning_rate": 0.00017277161455945723, + "loss": 0.8793, + "mean_token_accuracy": 0.7439113616943359, + "num_tokens": 34355974.0, + "step": 14850 + }, + { + "epoch": 0.136242779866141, + "learning_rate": 0.0001727532777115614, + "loss": 0.884, + "mean_token_accuracy": 0.7329540967941284, + "num_tokens": 34378899.0, + "step": 14860 + }, + { + "epoch": 0.13633446410562025, + "learning_rate": 0.00017273494086366556, + "loss": 0.8871, + "mean_token_accuracy": 0.7310245156288147, + "num_tokens": 34401704.0, + "step": 14870 + }, + { + "epoch": 0.13642614834509947, + "learning_rate": 0.0001727166040157697, + "loss": 0.858, + "mean_token_accuracy": 0.7442012190818786, + "num_tokens": 34424568.0, + "step": 14880 + }, + { + "epoch": 0.13651783258457872, + "learning_rate": 0.00017269826716787386, + "loss": 0.8618, + "mean_token_accuracy": 0.7480300724506378, + "num_tokens": 34447311.0, + "step": 14890 + }, + { + "epoch": 0.13660951682405795, + "learning_rate": 0.000172679930319978, + "loss": 0.8408, + "mean_token_accuracy": 0.7481724441051483, + "num_tokens": 34470874.0, + "step": 14900 + }, + { + "epoch": 0.13670120106353717, + "learning_rate": 0.00017266159347208214, + "loss": 0.9208, + "mean_token_accuracy": 0.7317855417728424, + "num_tokens": 34493724.0, + "step": 14910 + }, + { + "epoch": 0.13679288530301642, + "learning_rate": 0.0001726432566241863, + "loss": 0.8601, + "mean_token_accuracy": 0.7386585772037506, + "num_tokens": 34517071.0, + "step": 14920 + }, + { + "epoch": 0.13688456954249564, + "learning_rate": 0.00017262491977629047, + "loss": 0.8699, + "mean_token_accuracy": 0.7394436359405517, + "num_tokens": 34540311.0, + "step": 14930 + }, + { + "epoch": 0.13697625378197487, + "learning_rate": 0.00017260658292839464, + "loss": 0.8761, + "mean_token_accuracy": 0.7429749131202698, + "num_tokens": 34563600.0, + "step": 14940 + }, + { + "epoch": 0.13706793802145412, + "learning_rate": 0.00017258824608049877, + "loss": 0.8647, + "mean_token_accuracy": 0.7409651696681976, + "num_tokens": 34586227.0, + "step": 14950 + }, + { + "epoch": 0.13715962226093334, + "learning_rate": 0.0001725699092326029, + "loss": 0.846, + "mean_token_accuracy": 0.7521701097488404, + "num_tokens": 34609307.0, + "step": 14960 + }, + { + "epoch": 0.1372513065004126, + "learning_rate": 0.00017255157238470708, + "loss": 0.8579, + "mean_token_accuracy": 0.7402417600154877, + "num_tokens": 34632401.0, + "step": 14970 + }, + { + "epoch": 0.1373429907398918, + "learning_rate": 0.00017253323553681122, + "loss": 0.8366, + "mean_token_accuracy": 0.7455971479415894, + "num_tokens": 34655572.0, + "step": 14980 + }, + { + "epoch": 0.13743467497937104, + "learning_rate": 0.00017251489868891538, + "loss": 0.8303, + "mean_token_accuracy": 0.7452256083488464, + "num_tokens": 34678111.0, + "step": 14990 + }, + { + "epoch": 0.13752635921885029, + "learning_rate": 0.00017249656184101955, + "loss": 0.8298, + "mean_token_accuracy": 0.7465719163417817, + "num_tokens": 34702553.0, + "step": 15000 + }, + { + "epoch": 0.1376180434583295, + "learning_rate": 0.00017247822499312368, + "loss": 0.8511, + "mean_token_accuracy": 0.7408022582530975, + "num_tokens": 34725268.0, + "step": 15010 + }, + { + "epoch": 0.13770972769780876, + "learning_rate": 0.00017245988814522785, + "loss": 0.8866, + "mean_token_accuracy": 0.7359605014324189, + "num_tokens": 34748284.0, + "step": 15020 + }, + { + "epoch": 0.13780141193728798, + "learning_rate": 0.000172441551297332, + "loss": 0.8828, + "mean_token_accuracy": 0.7411446869373322, + "num_tokens": 34772131.0, + "step": 15030 + }, + { + "epoch": 0.1378930961767672, + "learning_rate": 0.00017242321444943615, + "loss": 0.8496, + "mean_token_accuracy": 0.7462159633636475, + "num_tokens": 34795648.0, + "step": 15040 + }, + { + "epoch": 0.13798478041624646, + "learning_rate": 0.0001724048776015403, + "loss": 0.8805, + "mean_token_accuracy": 0.7407910585403442, + "num_tokens": 34819991.0, + "step": 15050 + }, + { + "epoch": 0.13807646465572568, + "learning_rate": 0.00017238654075364446, + "loss": 0.8682, + "mean_token_accuracy": 0.742782711982727, + "num_tokens": 34843500.0, + "step": 15060 + }, + { + "epoch": 0.1381681488952049, + "learning_rate": 0.00017236820390574862, + "loss": 0.857, + "mean_token_accuracy": 0.7453341901302337, + "num_tokens": 34867460.0, + "step": 15070 + }, + { + "epoch": 0.13825983313468415, + "learning_rate": 0.00017234986705785276, + "loss": 0.8539, + "mean_token_accuracy": 0.7477288484573364, + "num_tokens": 34891119.0, + "step": 15080 + }, + { + "epoch": 0.13835151737416337, + "learning_rate": 0.00017233153020995693, + "loss": 0.8712, + "mean_token_accuracy": 0.7427833139896393, + "num_tokens": 34914637.0, + "step": 15090 + }, + { + "epoch": 0.13844320161364262, + "learning_rate": 0.00017231319336206107, + "loss": 0.8924, + "mean_token_accuracy": 0.7354365885257721, + "num_tokens": 34938035.0, + "step": 15100 + }, + { + "epoch": 0.13853488585312185, + "learning_rate": 0.0001722948565141652, + "loss": 0.8967, + "mean_token_accuracy": 0.7368919432163239, + "num_tokens": 34962046.0, + "step": 15110 + }, + { + "epoch": 0.13862657009260107, + "learning_rate": 0.0001722765196662694, + "loss": 0.8942, + "mean_token_accuracy": 0.7349571168422699, + "num_tokens": 34985902.0, + "step": 15120 + }, + { + "epoch": 0.13871825433208032, + "learning_rate": 0.00017225818281837353, + "loss": 0.8555, + "mean_token_accuracy": 0.7445537507534027, + "num_tokens": 35008986.0, + "step": 15130 + }, + { + "epoch": 0.13880993857155954, + "learning_rate": 0.0001722398459704777, + "loss": 0.8595, + "mean_token_accuracy": 0.7431390702724456, + "num_tokens": 35032371.0, + "step": 15140 + }, + { + "epoch": 0.1389016228110388, + "learning_rate": 0.00017222150912258184, + "loss": 0.9225, + "mean_token_accuracy": 0.7271012902259827, + "num_tokens": 35055932.0, + "step": 15150 + }, + { + "epoch": 0.13899330705051802, + "learning_rate": 0.00017220317227468598, + "loss": 0.8625, + "mean_token_accuracy": 0.7437769711017609, + "num_tokens": 35079900.0, + "step": 15160 + }, + { + "epoch": 0.13908499128999724, + "learning_rate": 0.00017218483542679014, + "loss": 0.8699, + "mean_token_accuracy": 0.741841334104538, + "num_tokens": 35103658.0, + "step": 15170 + }, + { + "epoch": 0.1391766755294765, + "learning_rate": 0.00017216649857889428, + "loss": 0.8824, + "mean_token_accuracy": 0.7311523973941803, + "num_tokens": 35126704.0, + "step": 15180 + }, + { + "epoch": 0.1392683597689557, + "learning_rate": 0.00017214816173099845, + "loss": 0.8449, + "mean_token_accuracy": 0.7465055763721467, + "num_tokens": 35149803.0, + "step": 15190 + }, + { + "epoch": 0.13936004400843496, + "learning_rate": 0.0001721298248831026, + "loss": 0.8934, + "mean_token_accuracy": 0.7403610050678253, + "num_tokens": 35173329.0, + "step": 15200 + }, + { + "epoch": 0.1394517282479142, + "learning_rate": 0.00017211148803520675, + "loss": 0.867, + "mean_token_accuracy": 0.7426059722900391, + "num_tokens": 35196346.0, + "step": 15210 + }, + { + "epoch": 0.1395434124873934, + "learning_rate": 0.00017209315118731091, + "loss": 0.8415, + "mean_token_accuracy": 0.7491662502288818, + "num_tokens": 35219268.0, + "step": 15220 + }, + { + "epoch": 0.13963509672687266, + "learning_rate": 0.00017207481433941505, + "loss": 0.9077, + "mean_token_accuracy": 0.7325476408004761, + "num_tokens": 35242623.0, + "step": 15230 + }, + { + "epoch": 0.13972678096635188, + "learning_rate": 0.00017205647749151922, + "loss": 0.8848, + "mean_token_accuracy": 0.7378370702266693, + "num_tokens": 35266277.0, + "step": 15240 + }, + { + "epoch": 0.1398184652058311, + "learning_rate": 0.00017203814064362338, + "loss": 0.8741, + "mean_token_accuracy": 0.7393323838710785, + "num_tokens": 35289214.0, + "step": 15250 + }, + { + "epoch": 0.13991014944531036, + "learning_rate": 0.00017201980379572752, + "loss": 0.8593, + "mean_token_accuracy": 0.7427632868289947, + "num_tokens": 35311458.0, + "step": 15260 + }, + { + "epoch": 0.14000183368478958, + "learning_rate": 0.0001720014669478317, + "loss": 0.8552, + "mean_token_accuracy": 0.7470477044582366, + "num_tokens": 35333737.0, + "step": 15270 + }, + { + "epoch": 0.14009351792426883, + "learning_rate": 0.00017198313009993583, + "loss": 0.8898, + "mean_token_accuracy": 0.7392634630203248, + "num_tokens": 35357066.0, + "step": 15280 + }, + { + "epoch": 0.14018520216374805, + "learning_rate": 0.00017196479325204, + "loss": 0.891, + "mean_token_accuracy": 0.741010183095932, + "num_tokens": 35379496.0, + "step": 15290 + }, + { + "epoch": 0.14027688640322727, + "learning_rate": 0.00017194645640414413, + "loss": 0.8885, + "mean_token_accuracy": 0.7416484355926514, + "num_tokens": 35402315.0, + "step": 15300 + }, + { + "epoch": 0.14036857064270652, + "learning_rate": 0.00017192811955624827, + "loss": 0.867, + "mean_token_accuracy": 0.736742228269577, + "num_tokens": 35425384.0, + "step": 15310 + }, + { + "epoch": 0.14046025488218575, + "learning_rate": 0.00017190978270835246, + "loss": 0.8352, + "mean_token_accuracy": 0.748482209444046, + "num_tokens": 35448273.0, + "step": 15320 + }, + { + "epoch": 0.140551939121665, + "learning_rate": 0.0001718914458604566, + "loss": 0.8616, + "mean_token_accuracy": 0.7401842474937439, + "num_tokens": 35471443.0, + "step": 15330 + }, + { + "epoch": 0.14064362336114422, + "learning_rate": 0.00017187310901256076, + "loss": 0.8454, + "mean_token_accuracy": 0.7439776420593261, + "num_tokens": 35494220.0, + "step": 15340 + }, + { + "epoch": 0.14073530760062344, + "learning_rate": 0.0001718547721646649, + "loss": 0.8585, + "mean_token_accuracy": 0.7468129754066467, + "num_tokens": 35516708.0, + "step": 15350 + }, + { + "epoch": 0.1408269918401027, + "learning_rate": 0.00017183643531676904, + "loss": 0.8568, + "mean_token_accuracy": 0.7475004255771637, + "num_tokens": 35539775.0, + "step": 15360 + }, + { + "epoch": 0.14091867607958192, + "learning_rate": 0.0001718180984688732, + "loss": 0.8814, + "mean_token_accuracy": 0.7429614782333374, + "num_tokens": 35564023.0, + "step": 15370 + }, + { + "epoch": 0.14101036031906114, + "learning_rate": 0.00017179976162097737, + "loss": 0.8494, + "mean_token_accuracy": 0.748023945093155, + "num_tokens": 35587842.0, + "step": 15380 + }, + { + "epoch": 0.1411020445585404, + "learning_rate": 0.0001717814247730815, + "loss": 0.894, + "mean_token_accuracy": 0.7352497637271881, + "num_tokens": 35610698.0, + "step": 15390 + }, + { + "epoch": 0.1411937287980196, + "learning_rate": 0.00017176308792518568, + "loss": 0.8624, + "mean_token_accuracy": 0.7445066869258881, + "num_tokens": 35633919.0, + "step": 15400 + }, + { + "epoch": 0.14128541303749886, + "learning_rate": 0.00017174475107728981, + "loss": 0.8812, + "mean_token_accuracy": 0.7427648067474365, + "num_tokens": 35656371.0, + "step": 15410 + }, + { + "epoch": 0.1413770972769781, + "learning_rate": 0.00017172641422939398, + "loss": 0.858, + "mean_token_accuracy": 0.7444013237953186, + "num_tokens": 35679926.0, + "step": 15420 + }, + { + "epoch": 0.1414687815164573, + "learning_rate": 0.00017170807738149812, + "loss": 0.8924, + "mean_token_accuracy": 0.7378455460071563, + "num_tokens": 35704186.0, + "step": 15430 + }, + { + "epoch": 0.14156046575593656, + "learning_rate": 0.00017168974053360228, + "loss": 0.8943, + "mean_token_accuracy": 0.7372198641300202, + "num_tokens": 35727393.0, + "step": 15440 + }, + { + "epoch": 0.14165214999541578, + "learning_rate": 0.00017167140368570645, + "loss": 0.8957, + "mean_token_accuracy": 0.734748101234436, + "num_tokens": 35749874.0, + "step": 15450 + }, + { + "epoch": 0.14174383423489503, + "learning_rate": 0.0001716530668378106, + "loss": 0.8487, + "mean_token_accuracy": 0.7426269173622131, + "num_tokens": 35772862.0, + "step": 15460 + }, + { + "epoch": 0.14183551847437426, + "learning_rate": 0.00017163472998991475, + "loss": 0.8364, + "mean_token_accuracy": 0.7502005517482757, + "num_tokens": 35795644.0, + "step": 15470 + }, + { + "epoch": 0.14192720271385348, + "learning_rate": 0.0001716163931420189, + "loss": 0.8928, + "mean_token_accuracy": 0.7369527220726013, + "num_tokens": 35818756.0, + "step": 15480 + }, + { + "epoch": 0.14201888695333273, + "learning_rate": 0.00017159805629412306, + "loss": 0.8422, + "mean_token_accuracy": 0.748214191198349, + "num_tokens": 35841885.0, + "step": 15490 + }, + { + "epoch": 0.14211057119281195, + "learning_rate": 0.0001715797194462272, + "loss": 0.8917, + "mean_token_accuracy": 0.7364135205745697, + "num_tokens": 35865058.0, + "step": 15500 + }, + { + "epoch": 0.1422022554322912, + "learning_rate": 0.00017156138259833136, + "loss": 0.8266, + "mean_token_accuracy": 0.7535389542579651, + "num_tokens": 35888439.0, + "step": 15510 + }, + { + "epoch": 0.14229393967177043, + "learning_rate": 0.00017154304575043552, + "loss": 0.8666, + "mean_token_accuracy": 0.736277061700821, + "num_tokens": 35912253.0, + "step": 15520 + }, + { + "epoch": 0.14238562391124965, + "learning_rate": 0.00017152470890253966, + "loss": 0.8887, + "mean_token_accuracy": 0.7365772306919098, + "num_tokens": 35935184.0, + "step": 15530 + }, + { + "epoch": 0.1424773081507289, + "learning_rate": 0.00017150637205464383, + "loss": 0.9029, + "mean_token_accuracy": 0.7392226040363312, + "num_tokens": 35957892.0, + "step": 15540 + }, + { + "epoch": 0.14256899239020812, + "learning_rate": 0.00017148803520674797, + "loss": 0.8513, + "mean_token_accuracy": 0.7421040892601013, + "num_tokens": 35980740.0, + "step": 15550 + }, + { + "epoch": 0.14266067662968734, + "learning_rate": 0.0001714696983588521, + "loss": 0.8492, + "mean_token_accuracy": 0.738554447889328, + "num_tokens": 36004105.0, + "step": 15560 + }, + { + "epoch": 0.1427523608691666, + "learning_rate": 0.00017145136151095627, + "loss": 0.8761, + "mean_token_accuracy": 0.7424564182758331, + "num_tokens": 36027396.0, + "step": 15570 + }, + { + "epoch": 0.14284404510864582, + "learning_rate": 0.00017143302466306044, + "loss": 0.8548, + "mean_token_accuracy": 0.741351866722107, + "num_tokens": 36050220.0, + "step": 15580 + }, + { + "epoch": 0.14293572934812507, + "learning_rate": 0.00017141468781516457, + "loss": 0.8722, + "mean_token_accuracy": 0.7424733400344848, + "num_tokens": 36074020.0, + "step": 15590 + }, + { + "epoch": 0.1430274135876043, + "learning_rate": 0.00017139635096726874, + "loss": 0.8819, + "mean_token_accuracy": 0.7411562919616699, + "num_tokens": 36096764.0, + "step": 15600 + }, + { + "epoch": 0.1431190978270835, + "learning_rate": 0.00017137801411937288, + "loss": 0.8361, + "mean_token_accuracy": 0.7521393835544586, + "num_tokens": 36119354.0, + "step": 15610 + }, + { + "epoch": 0.14321078206656276, + "learning_rate": 0.00017135967727147704, + "loss": 0.8811, + "mean_token_accuracy": 0.7374622523784637, + "num_tokens": 36143320.0, + "step": 15620 + }, + { + "epoch": 0.143302466306042, + "learning_rate": 0.00017134134042358118, + "loss": 0.9099, + "mean_token_accuracy": 0.7347093343734741, + "num_tokens": 36167441.0, + "step": 15630 + }, + { + "epoch": 0.14339415054552124, + "learning_rate": 0.00017132300357568535, + "loss": 0.8793, + "mean_token_accuracy": 0.7435518801212311, + "num_tokens": 36190208.0, + "step": 15640 + }, + { + "epoch": 0.14348583478500046, + "learning_rate": 0.0001713046667277895, + "loss": 0.8869, + "mean_token_accuracy": 0.7344530284404754, + "num_tokens": 36212747.0, + "step": 15650 + }, + { + "epoch": 0.14357751902447968, + "learning_rate": 0.00017128632987989365, + "loss": 0.9215, + "mean_token_accuracy": 0.7322555363178254, + "num_tokens": 36236226.0, + "step": 15660 + }, + { + "epoch": 0.14366920326395893, + "learning_rate": 0.00017126799303199782, + "loss": 0.916, + "mean_token_accuracy": 0.739119553565979, + "num_tokens": 36259439.0, + "step": 15670 + }, + { + "epoch": 0.14376088750343816, + "learning_rate": 0.00017124965618410195, + "loss": 0.8543, + "mean_token_accuracy": 0.7416538894176483, + "num_tokens": 36282354.0, + "step": 15680 + }, + { + "epoch": 0.14385257174291738, + "learning_rate": 0.00017123131933620612, + "loss": 0.8778, + "mean_token_accuracy": 0.7373986840248108, + "num_tokens": 36305510.0, + "step": 15690 + }, + { + "epoch": 0.14394425598239663, + "learning_rate": 0.00017121298248831026, + "loss": 0.8462, + "mean_token_accuracy": 0.753288346529007, + "num_tokens": 36328607.0, + "step": 15700 + }, + { + "epoch": 0.14403594022187585, + "learning_rate": 0.00017119464564041442, + "loss": 0.8365, + "mean_token_accuracy": 0.7509838223457337, + "num_tokens": 36351930.0, + "step": 15710 + }, + { + "epoch": 0.1441276244613551, + "learning_rate": 0.0001711763087925186, + "loss": 0.8594, + "mean_token_accuracy": 0.7432153224945068, + "num_tokens": 36374693.0, + "step": 15720 + }, + { + "epoch": 0.14421930870083433, + "learning_rate": 0.00017115797194462273, + "loss": 0.8842, + "mean_token_accuracy": 0.7355160593986512, + "num_tokens": 36398007.0, + "step": 15730 + }, + { + "epoch": 0.14431099294031355, + "learning_rate": 0.0001711396350967269, + "loss": 0.8893, + "mean_token_accuracy": 0.7363717138767243, + "num_tokens": 36420952.0, + "step": 15740 + }, + { + "epoch": 0.1444026771797928, + "learning_rate": 0.00017112129824883103, + "loss": 0.8924, + "mean_token_accuracy": 0.7350456714630127, + "num_tokens": 36443933.0, + "step": 15750 + }, + { + "epoch": 0.14449436141927202, + "learning_rate": 0.00017110296140093517, + "loss": 0.9009, + "mean_token_accuracy": 0.7325533866882324, + "num_tokens": 36466978.0, + "step": 15760 + }, + { + "epoch": 0.14458604565875127, + "learning_rate": 0.00017108462455303934, + "loss": 0.8756, + "mean_token_accuracy": 0.7401955187320709, + "num_tokens": 36489975.0, + "step": 15770 + }, + { + "epoch": 0.1446777298982305, + "learning_rate": 0.0001710662877051435, + "loss": 0.856, + "mean_token_accuracy": 0.7392392814159393, + "num_tokens": 36513624.0, + "step": 15780 + }, + { + "epoch": 0.14476941413770972, + "learning_rate": 0.00017104795085724764, + "loss": 0.864, + "mean_token_accuracy": 0.7432485938072204, + "num_tokens": 36536843.0, + "step": 15790 + }, + { + "epoch": 0.14486109837718897, + "learning_rate": 0.0001710296140093518, + "loss": 0.861, + "mean_token_accuracy": 0.7388611733913422, + "num_tokens": 36559656.0, + "step": 15800 + }, + { + "epoch": 0.1449527826166682, + "learning_rate": 0.00017101127716145594, + "loss": 0.9033, + "mean_token_accuracy": 0.7361470818519592, + "num_tokens": 36583295.0, + "step": 15810 + }, + { + "epoch": 0.14504446685614744, + "learning_rate": 0.0001709929403135601, + "loss": 0.8875, + "mean_token_accuracy": 0.7397248089313507, + "num_tokens": 36605779.0, + "step": 15820 + }, + { + "epoch": 0.14513615109562666, + "learning_rate": 0.00017097460346566425, + "loss": 0.8691, + "mean_token_accuracy": 0.7428908169269561, + "num_tokens": 36628121.0, + "step": 15830 + }, + { + "epoch": 0.1452278353351059, + "learning_rate": 0.0001709562666177684, + "loss": 0.8702, + "mean_token_accuracy": 0.7383060693740845, + "num_tokens": 36651628.0, + "step": 15840 + }, + { + "epoch": 0.14531951957458514, + "learning_rate": 0.00017093792976987258, + "loss": 0.8666, + "mean_token_accuracy": 0.7416314542293548, + "num_tokens": 36674567.0, + "step": 15850 + }, + { + "epoch": 0.14541120381406436, + "learning_rate": 0.00017091959292197672, + "loss": 0.9071, + "mean_token_accuracy": 0.734781700372696, + "num_tokens": 36697863.0, + "step": 15860 + }, + { + "epoch": 0.14550288805354358, + "learning_rate": 0.00017090125607408088, + "loss": 0.9083, + "mean_token_accuracy": 0.7320820689201355, + "num_tokens": 36721003.0, + "step": 15870 + }, + { + "epoch": 0.14559457229302283, + "learning_rate": 0.00017088291922618502, + "loss": 0.8586, + "mean_token_accuracy": 0.7432838439941406, + "num_tokens": 36743910.0, + "step": 15880 + }, + { + "epoch": 0.14568625653250206, + "learning_rate": 0.00017086458237828918, + "loss": 0.8947, + "mean_token_accuracy": 0.739415991306305, + "num_tokens": 36766315.0, + "step": 15890 + }, + { + "epoch": 0.1457779407719813, + "learning_rate": 0.00017084624553039332, + "loss": 0.8755, + "mean_token_accuracy": 0.7403792202472687, + "num_tokens": 36788852.0, + "step": 15900 + }, + { + "epoch": 0.14586962501146053, + "learning_rate": 0.0001708279086824975, + "loss": 0.8744, + "mean_token_accuracy": 0.7431094586849213, + "num_tokens": 36811735.0, + "step": 15910 + }, + { + "epoch": 0.14596130925093975, + "learning_rate": 0.00017080957183460165, + "loss": 0.8407, + "mean_token_accuracy": 0.7473398447036743, + "num_tokens": 36834411.0, + "step": 15920 + }, + { + "epoch": 0.146052993490419, + "learning_rate": 0.0001707912349867058, + "loss": 0.8466, + "mean_token_accuracy": 0.749835342168808, + "num_tokens": 36856962.0, + "step": 15930 + }, + { + "epoch": 0.14614467772989823, + "learning_rate": 0.00017077289813880996, + "loss": 0.8417, + "mean_token_accuracy": 0.7449469566345215, + "num_tokens": 36880853.0, + "step": 15940 + }, + { + "epoch": 0.14623636196937748, + "learning_rate": 0.0001707545612909141, + "loss": 0.8946, + "mean_token_accuracy": 0.7358967542648316, + "num_tokens": 36904041.0, + "step": 15950 + }, + { + "epoch": 0.1463280462088567, + "learning_rate": 0.00017073622444301823, + "loss": 0.9127, + "mean_token_accuracy": 0.7398579776287079, + "num_tokens": 36927780.0, + "step": 15960 + }, + { + "epoch": 0.14641973044833592, + "learning_rate": 0.00017071788759512243, + "loss": 0.8529, + "mean_token_accuracy": 0.7463305592536926, + "num_tokens": 36950260.0, + "step": 15970 + }, + { + "epoch": 0.14651141468781517, + "learning_rate": 0.00017069955074722656, + "loss": 0.8771, + "mean_token_accuracy": 0.7401873469352722, + "num_tokens": 36973332.0, + "step": 15980 + }, + { + "epoch": 0.1466030989272944, + "learning_rate": 0.0001706812138993307, + "loss": 0.8793, + "mean_token_accuracy": 0.7394184529781341, + "num_tokens": 36996111.0, + "step": 15990 + }, + { + "epoch": 0.14669478316677362, + "learning_rate": 0.00017066287705143487, + "loss": 0.88, + "mean_token_accuracy": 0.7426718354225159, + "num_tokens": 37019427.0, + "step": 16000 + }, + { + "epoch": 0.14678646740625287, + "learning_rate": 0.000170644540203539, + "loss": 0.9024, + "mean_token_accuracy": 0.7295919239521027, + "num_tokens": 37043087.0, + "step": 16010 + }, + { + "epoch": 0.1468781516457321, + "learning_rate": 0.00017062620335564317, + "loss": 0.8745, + "mean_token_accuracy": 0.7450354874134064, + "num_tokens": 37066364.0, + "step": 16020 + }, + { + "epoch": 0.14696983588521134, + "learning_rate": 0.0001706078665077473, + "loss": 0.8659, + "mean_token_accuracy": 0.7447131872177124, + "num_tokens": 37089369.0, + "step": 16030 + }, + { + "epoch": 0.14706152012469056, + "learning_rate": 0.00017058952965985148, + "loss": 0.8537, + "mean_token_accuracy": 0.7468583405017852, + "num_tokens": 37112609.0, + "step": 16040 + }, + { + "epoch": 0.1471532043641698, + "learning_rate": 0.00017057119281195564, + "loss": 0.9012, + "mean_token_accuracy": 0.7315944612026215, + "num_tokens": 37135391.0, + "step": 16050 + }, + { + "epoch": 0.14724488860364904, + "learning_rate": 0.00017055285596405978, + "loss": 0.8897, + "mean_token_accuracy": 0.7404382467269898, + "num_tokens": 37157542.0, + "step": 16060 + }, + { + "epoch": 0.14733657284312826, + "learning_rate": 0.00017053451911616395, + "loss": 0.853, + "mean_token_accuracy": 0.7500638067722321, + "num_tokens": 37180347.0, + "step": 16070 + }, + { + "epoch": 0.1474282570826075, + "learning_rate": 0.00017051618226826808, + "loss": 0.865, + "mean_token_accuracy": 0.7455952882766723, + "num_tokens": 37203148.0, + "step": 16080 + }, + { + "epoch": 0.14751994132208673, + "learning_rate": 0.00017049784542037225, + "loss": 0.8444, + "mean_token_accuracy": 0.7497556746006012, + "num_tokens": 37226287.0, + "step": 16090 + }, + { + "epoch": 0.14761162556156596, + "learning_rate": 0.00017047950857247641, + "loss": 0.8825, + "mean_token_accuracy": 0.7477022767066955, + "num_tokens": 37249004.0, + "step": 16100 + }, + { + "epoch": 0.1477033098010452, + "learning_rate": 0.00017046117172458055, + "loss": 0.8668, + "mean_token_accuracy": 0.7420090973377228, + "num_tokens": 37272304.0, + "step": 16110 + }, + { + "epoch": 0.14779499404052443, + "learning_rate": 0.00017044283487668472, + "loss": 0.8671, + "mean_token_accuracy": 0.7381621420383453, + "num_tokens": 37295281.0, + "step": 16120 + }, + { + "epoch": 0.14788667828000368, + "learning_rate": 0.00017042449802878886, + "loss": 0.8722, + "mean_token_accuracy": 0.740356034040451, + "num_tokens": 37317828.0, + "step": 16130 + }, + { + "epoch": 0.1479783625194829, + "learning_rate": 0.00017040616118089302, + "loss": 0.8633, + "mean_token_accuracy": 0.7404953300952911, + "num_tokens": 37340704.0, + "step": 16140 + }, + { + "epoch": 0.14807004675896213, + "learning_rate": 0.00017038782433299716, + "loss": 0.8389, + "mean_token_accuracy": 0.7452967226505279, + "num_tokens": 37362928.0, + "step": 16150 + }, + { + "epoch": 0.14816173099844138, + "learning_rate": 0.0001703694874851013, + "loss": 0.8689, + "mean_token_accuracy": 0.7365191996097564, + "num_tokens": 37385600.0, + "step": 16160 + }, + { + "epoch": 0.1482534152379206, + "learning_rate": 0.0001703511506372055, + "loss": 0.8949, + "mean_token_accuracy": 0.7305776953697205, + "num_tokens": 37408518.0, + "step": 16170 + }, + { + "epoch": 0.14834509947739982, + "learning_rate": 0.00017033281378930963, + "loss": 0.8396, + "mean_token_accuracy": 0.7508726000785828, + "num_tokens": 37431714.0, + "step": 16180 + }, + { + "epoch": 0.14843678371687907, + "learning_rate": 0.00017031447694141377, + "loss": 0.8877, + "mean_token_accuracy": 0.7442928493022919, + "num_tokens": 37455286.0, + "step": 16190 + }, + { + "epoch": 0.1485284679563583, + "learning_rate": 0.00017029614009351793, + "loss": 0.8895, + "mean_token_accuracy": 0.738189160823822, + "num_tokens": 37478469.0, + "step": 16200 + }, + { + "epoch": 0.14862015219583755, + "learning_rate": 0.00017027780324562207, + "loss": 0.8995, + "mean_token_accuracy": 0.7329420864582061, + "num_tokens": 37501267.0, + "step": 16210 + }, + { + "epoch": 0.14871183643531677, + "learning_rate": 0.00017025946639772624, + "loss": 0.8444, + "mean_token_accuracy": 0.7452007949352264, + "num_tokens": 37523554.0, + "step": 16220 + }, + { + "epoch": 0.148803520674796, + "learning_rate": 0.0001702411295498304, + "loss": 0.9022, + "mean_token_accuracy": 0.73763148188591, + "num_tokens": 37547044.0, + "step": 16230 + }, + { + "epoch": 0.14889520491427524, + "learning_rate": 0.00017022279270193454, + "loss": 0.8462, + "mean_token_accuracy": 0.7493780314922333, + "num_tokens": 37569517.0, + "step": 16240 + }, + { + "epoch": 0.14898688915375446, + "learning_rate": 0.0001702044558540387, + "loss": 0.9, + "mean_token_accuracy": 0.736665791273117, + "num_tokens": 37592746.0, + "step": 16250 + }, + { + "epoch": 0.14907857339323372, + "learning_rate": 0.00017018611900614284, + "loss": 0.9179, + "mean_token_accuracy": 0.7329012751579285, + "num_tokens": 37616892.0, + "step": 16260 + }, + { + "epoch": 0.14917025763271294, + "learning_rate": 0.000170167782158247, + "loss": 0.8869, + "mean_token_accuracy": 0.7348154604434967, + "num_tokens": 37640878.0, + "step": 16270 + }, + { + "epoch": 0.14926194187219216, + "learning_rate": 0.00017014944531035115, + "loss": 0.8831, + "mean_token_accuracy": 0.7386293411254883, + "num_tokens": 37664360.0, + "step": 16280 + }, + { + "epoch": 0.1493536261116714, + "learning_rate": 0.0001701311084624553, + "loss": 0.8402, + "mean_token_accuracy": 0.7535671114921569, + "num_tokens": 37688008.0, + "step": 16290 + }, + { + "epoch": 0.14944531035115063, + "learning_rate": 0.00017011277161455948, + "loss": 0.8639, + "mean_token_accuracy": 0.7393059194087982, + "num_tokens": 37710843.0, + "step": 16300 + }, + { + "epoch": 0.14953699459062986, + "learning_rate": 0.00017009443476666362, + "loss": 0.8823, + "mean_token_accuracy": 0.7435824513435364, + "num_tokens": 37734174.0, + "step": 16310 + }, + { + "epoch": 0.1496286788301091, + "learning_rate": 0.00017007609791876778, + "loss": 0.8803, + "mean_token_accuracy": 0.7369657516479492, + "num_tokens": 37757725.0, + "step": 16320 + }, + { + "epoch": 0.14972036306958833, + "learning_rate": 0.00017005776107087192, + "loss": 0.8222, + "mean_token_accuracy": 0.7561168491840362, + "num_tokens": 37780735.0, + "step": 16330 + }, + { + "epoch": 0.14981204730906758, + "learning_rate": 0.00017003942422297609, + "loss": 0.8919, + "mean_token_accuracy": 0.7403030455112457, + "num_tokens": 37803988.0, + "step": 16340 + }, + { + "epoch": 0.1499037315485468, + "learning_rate": 0.00017002108737508022, + "loss": 0.8943, + "mean_token_accuracy": 0.7361368477344513, + "num_tokens": 37827326.0, + "step": 16350 + }, + { + "epoch": 0.14999541578802603, + "learning_rate": 0.0001700027505271844, + "loss": 0.9001, + "mean_token_accuracy": 0.7352225959300995, + "num_tokens": 37849799.0, + "step": 16360 + }, + { + "epoch": 0.15008710002750528, + "learning_rate": 0.00016998441367928856, + "loss": 0.8698, + "mean_token_accuracy": 0.7423892736434936, + "num_tokens": 37872842.0, + "step": 16370 + }, + { + "epoch": 0.1501787842669845, + "learning_rate": 0.0001699660768313927, + "loss": 0.8658, + "mean_token_accuracy": 0.74049591422081, + "num_tokens": 37896520.0, + "step": 16380 + }, + { + "epoch": 0.15027046850646375, + "learning_rate": 0.00016994773998349683, + "loss": 0.8559, + "mean_token_accuracy": 0.7443911910057068, + "num_tokens": 37919910.0, + "step": 16390 + }, + { + "epoch": 0.15036215274594297, + "learning_rate": 0.000169929403135601, + "loss": 0.8546, + "mean_token_accuracy": 0.7446241974830627, + "num_tokens": 37943244.0, + "step": 16400 + }, + { + "epoch": 0.1504538369854222, + "learning_rate": 0.00016991106628770514, + "loss": 0.8407, + "mean_token_accuracy": 0.7498221933841706, + "num_tokens": 37966098.0, + "step": 16410 + }, + { + "epoch": 0.15054552122490145, + "learning_rate": 0.0001698927294398093, + "loss": 0.9167, + "mean_token_accuracy": 0.7348417937755585, + "num_tokens": 37989078.0, + "step": 16420 + }, + { + "epoch": 0.15063720546438067, + "learning_rate": 0.00016987439259191347, + "loss": 0.9307, + "mean_token_accuracy": 0.7289546847343444, + "num_tokens": 38012011.0, + "step": 16430 + }, + { + "epoch": 0.15072888970385992, + "learning_rate": 0.0001698560557440176, + "loss": 0.8998, + "mean_token_accuracy": 0.7262084662914277, + "num_tokens": 38035169.0, + "step": 16440 + }, + { + "epoch": 0.15082057394333914, + "learning_rate": 0.00016983771889612177, + "loss": 0.8371, + "mean_token_accuracy": 0.7426431775093079, + "num_tokens": 38058471.0, + "step": 16450 + }, + { + "epoch": 0.15091225818281837, + "learning_rate": 0.0001698193820482259, + "loss": 0.8904, + "mean_token_accuracy": 0.7356981933116913, + "num_tokens": 38081511.0, + "step": 16460 + }, + { + "epoch": 0.15100394242229762, + "learning_rate": 0.00016980104520033007, + "loss": 0.8985, + "mean_token_accuracy": 0.736701226234436, + "num_tokens": 38104079.0, + "step": 16470 + }, + { + "epoch": 0.15109562666177684, + "learning_rate": 0.0001697827083524342, + "loss": 0.8682, + "mean_token_accuracy": 0.7417209446430206, + "num_tokens": 38126801.0, + "step": 16480 + }, + { + "epoch": 0.15118731090125606, + "learning_rate": 0.00016976437150453838, + "loss": 0.8731, + "mean_token_accuracy": 0.7413496732711792, + "num_tokens": 38149794.0, + "step": 16490 + }, + { + "epoch": 0.1512789951407353, + "learning_rate": 0.00016974603465664254, + "loss": 0.8699, + "mean_token_accuracy": 0.7438834309577942, + "num_tokens": 38172585.0, + "step": 16500 + }, + { + "epoch": 0.15137067938021453, + "learning_rate": 0.00016972769780874668, + "loss": 0.84, + "mean_token_accuracy": 0.7425670325756073, + "num_tokens": 38195448.0, + "step": 16510 + }, + { + "epoch": 0.15146236361969379, + "learning_rate": 0.00016970936096085085, + "loss": 0.8955, + "mean_token_accuracy": 0.7389983892440796, + "num_tokens": 38219907.0, + "step": 16520 + }, + { + "epoch": 0.151554047859173, + "learning_rate": 0.00016969102411295499, + "loss": 0.8762, + "mean_token_accuracy": 0.7366839945316315, + "num_tokens": 38242733.0, + "step": 16530 + }, + { + "epoch": 0.15164573209865223, + "learning_rate": 0.00016967268726505915, + "loss": 0.9292, + "mean_token_accuracy": 0.7314104080200196, + "num_tokens": 38265375.0, + "step": 16540 + }, + { + "epoch": 0.15173741633813148, + "learning_rate": 0.0001696543504171633, + "loss": 0.8543, + "mean_token_accuracy": 0.7488788306713104, + "num_tokens": 38288239.0, + "step": 16550 + }, + { + "epoch": 0.1518291005776107, + "learning_rate": 0.00016963601356926745, + "loss": 0.8892, + "mean_token_accuracy": 0.7305476188659668, + "num_tokens": 38311485.0, + "step": 16560 + }, + { + "epoch": 0.15192078481708995, + "learning_rate": 0.00016961767672137162, + "loss": 0.8634, + "mean_token_accuracy": 0.7440915644168854, + "num_tokens": 38334683.0, + "step": 16570 + }, + { + "epoch": 0.15201246905656918, + "learning_rate": 0.00016959933987347576, + "loss": 0.8663, + "mean_token_accuracy": 0.7366457760334015, + "num_tokens": 38357877.0, + "step": 16580 + }, + { + "epoch": 0.1521041532960484, + "learning_rate": 0.0001695810030255799, + "loss": 0.8546, + "mean_token_accuracy": 0.7432753086090088, + "num_tokens": 38380922.0, + "step": 16590 + }, + { + "epoch": 0.15219583753552765, + "learning_rate": 0.00016956266617768406, + "loss": 0.8485, + "mean_token_accuracy": 0.7470687568187714, + "num_tokens": 38403242.0, + "step": 16600 + }, + { + "epoch": 0.15228752177500687, + "learning_rate": 0.0001695443293297882, + "loss": 0.849, + "mean_token_accuracy": 0.7500737011432648, + "num_tokens": 38426605.0, + "step": 16610 + }, + { + "epoch": 0.1523792060144861, + "learning_rate": 0.0001695259924818924, + "loss": 0.8631, + "mean_token_accuracy": 0.747471010684967, + "num_tokens": 38449559.0, + "step": 16620 + }, + { + "epoch": 0.15247089025396535, + "learning_rate": 0.00016950765563399653, + "loss": 0.871, + "mean_token_accuracy": 0.7461052656173706, + "num_tokens": 38472792.0, + "step": 16630 + }, + { + "epoch": 0.15256257449344457, + "learning_rate": 0.00016948931878610067, + "loss": 0.888, + "mean_token_accuracy": 0.7389775276184082, + "num_tokens": 38496150.0, + "step": 16640 + }, + { + "epoch": 0.15265425873292382, + "learning_rate": 0.00016947098193820483, + "loss": 0.8231, + "mean_token_accuracy": 0.751199460029602, + "num_tokens": 38519388.0, + "step": 16650 + }, + { + "epoch": 0.15274594297240304, + "learning_rate": 0.00016945264509030897, + "loss": 0.7743, + "mean_token_accuracy": 0.7645283997058868, + "num_tokens": 38541871.0, + "step": 16660 + }, + { + "epoch": 0.15283762721188227, + "learning_rate": 0.00016943430824241314, + "loss": 0.8537, + "mean_token_accuracy": 0.7426731526851654, + "num_tokens": 38565786.0, + "step": 16670 + }, + { + "epoch": 0.15292931145136152, + "learning_rate": 0.00016941597139451728, + "loss": 0.8846, + "mean_token_accuracy": 0.7351303577423096, + "num_tokens": 38588275.0, + "step": 16680 + }, + { + "epoch": 0.15302099569084074, + "learning_rate": 0.00016939763454662144, + "loss": 0.8786, + "mean_token_accuracy": 0.7357687294483185, + "num_tokens": 38611373.0, + "step": 16690 + }, + { + "epoch": 0.15311267993032, + "learning_rate": 0.0001693792976987256, + "loss": 0.8672, + "mean_token_accuracy": 0.7499398589134216, + "num_tokens": 38635003.0, + "step": 16700 + }, + { + "epoch": 0.1532043641697992, + "learning_rate": 0.00016936096085082975, + "loss": 0.8927, + "mean_token_accuracy": 0.7349049627780915, + "num_tokens": 38657858.0, + "step": 16710 + }, + { + "epoch": 0.15329604840927843, + "learning_rate": 0.0001693426240029339, + "loss": 0.8161, + "mean_token_accuracy": 0.7554900467395782, + "num_tokens": 38680885.0, + "step": 16720 + }, + { + "epoch": 0.15338773264875769, + "learning_rate": 0.00016932428715503805, + "loss": 0.8772, + "mean_token_accuracy": 0.7395583987236023, + "num_tokens": 38704389.0, + "step": 16730 + }, + { + "epoch": 0.1534794168882369, + "learning_rate": 0.00016930595030714222, + "loss": 0.8847, + "mean_token_accuracy": 0.7397893249988556, + "num_tokens": 38726402.0, + "step": 16740 + }, + { + "epoch": 0.15357110112771616, + "learning_rate": 0.00016928761345924638, + "loss": 0.8861, + "mean_token_accuracy": 0.7350054621696472, + "num_tokens": 38748572.0, + "step": 16750 + }, + { + "epoch": 0.15366278536719538, + "learning_rate": 0.00016926927661135052, + "loss": 0.8551, + "mean_token_accuracy": 0.7403785765171051, + "num_tokens": 38771042.0, + "step": 16760 + }, + { + "epoch": 0.1537544696066746, + "learning_rate": 0.00016925093976345468, + "loss": 0.8563, + "mean_token_accuracy": 0.7481821477413177, + "num_tokens": 38793985.0, + "step": 16770 + }, + { + "epoch": 0.15384615384615385, + "learning_rate": 0.00016923260291555882, + "loss": 0.9078, + "mean_token_accuracy": 0.7312174201011657, + "num_tokens": 38817376.0, + "step": 16780 + }, + { + "epoch": 0.15393783808563308, + "learning_rate": 0.00016921426606766296, + "loss": 0.896, + "mean_token_accuracy": 0.7304867029190063, + "num_tokens": 38840997.0, + "step": 16790 + }, + { + "epoch": 0.1540295223251123, + "learning_rate": 0.00016919592921976713, + "loss": 0.9133, + "mean_token_accuracy": 0.7256821393966675, + "num_tokens": 38864395.0, + "step": 16800 + }, + { + "epoch": 0.15412120656459155, + "learning_rate": 0.00016917759237187126, + "loss": 0.8646, + "mean_token_accuracy": 0.7446182489395141, + "num_tokens": 38887982.0, + "step": 16810 + }, + { + "epoch": 0.15421289080407077, + "learning_rate": 0.00016915925552397546, + "loss": 0.8449, + "mean_token_accuracy": 0.7444073379039764, + "num_tokens": 38911351.0, + "step": 16820 + }, + { + "epoch": 0.15430457504355002, + "learning_rate": 0.0001691409186760796, + "loss": 0.8894, + "mean_token_accuracy": 0.7392773270606995, + "num_tokens": 38934444.0, + "step": 16830 + }, + { + "epoch": 0.15439625928302925, + "learning_rate": 0.00016912258182818373, + "loss": 0.8657, + "mean_token_accuracy": 0.7407513499259949, + "num_tokens": 38957685.0, + "step": 16840 + }, + { + "epoch": 0.15448794352250847, + "learning_rate": 0.0001691042449802879, + "loss": 0.8771, + "mean_token_accuracy": 0.7445762813091278, + "num_tokens": 38980926.0, + "step": 16850 + }, + { + "epoch": 0.15457962776198772, + "learning_rate": 0.00016908590813239204, + "loss": 0.8764, + "mean_token_accuracy": 0.740376353263855, + "num_tokens": 39003981.0, + "step": 16860 + }, + { + "epoch": 0.15467131200146694, + "learning_rate": 0.0001690675712844962, + "loss": 0.8618, + "mean_token_accuracy": 0.7444840729236603, + "num_tokens": 39026544.0, + "step": 16870 + }, + { + "epoch": 0.1547629962409462, + "learning_rate": 0.00016904923443660034, + "loss": 0.8746, + "mean_token_accuracy": 0.7461060881614685, + "num_tokens": 39050280.0, + "step": 16880 + }, + { + "epoch": 0.15485468048042542, + "learning_rate": 0.0001690308975887045, + "loss": 0.9001, + "mean_token_accuracy": 0.7330372750759124, + "num_tokens": 39073130.0, + "step": 16890 + }, + { + "epoch": 0.15494636471990464, + "learning_rate": 0.00016901256074080867, + "loss": 0.8652, + "mean_token_accuracy": 0.7405720889568329, + "num_tokens": 39096834.0, + "step": 16900 + }, + { + "epoch": 0.1550380489593839, + "learning_rate": 0.0001689942238929128, + "loss": 0.8427, + "mean_token_accuracy": 0.7495450854301453, + "num_tokens": 39119212.0, + "step": 16910 + }, + { + "epoch": 0.1551297331988631, + "learning_rate": 0.00016897588704501698, + "loss": 0.8744, + "mean_token_accuracy": 0.7428697288036347, + "num_tokens": 39142979.0, + "step": 16920 + }, + { + "epoch": 0.15522141743834236, + "learning_rate": 0.00016895755019712111, + "loss": 0.9012, + "mean_token_accuracy": 0.7362680971622467, + "num_tokens": 39165585.0, + "step": 16930 + }, + { + "epoch": 0.15531310167782159, + "learning_rate": 0.00016893921334922528, + "loss": 0.8311, + "mean_token_accuracy": 0.7509696185588837, + "num_tokens": 39188522.0, + "step": 16940 + }, + { + "epoch": 0.1554047859173008, + "learning_rate": 0.00016892087650132945, + "loss": 0.9017, + "mean_token_accuracy": 0.7352629005908966, + "num_tokens": 39211450.0, + "step": 16950 + }, + { + "epoch": 0.15549647015678006, + "learning_rate": 0.00016890253965343358, + "loss": 0.8318, + "mean_token_accuracy": 0.7483528077602386, + "num_tokens": 39234302.0, + "step": 16960 + }, + { + "epoch": 0.15558815439625928, + "learning_rate": 0.00016888420280553775, + "loss": 0.8588, + "mean_token_accuracy": 0.7395950853824615, + "num_tokens": 39257127.0, + "step": 16970 + }, + { + "epoch": 0.1556798386357385, + "learning_rate": 0.0001688658659576419, + "loss": 0.8363, + "mean_token_accuracy": 0.7496638536453247, + "num_tokens": 39279972.0, + "step": 16980 + }, + { + "epoch": 0.15577152287521775, + "learning_rate": 0.00016884752910974603, + "loss": 0.8581, + "mean_token_accuracy": 0.7437224447727203, + "num_tokens": 39304175.0, + "step": 16990 + }, + { + "epoch": 0.15586320711469698, + "learning_rate": 0.0001688291922618502, + "loss": 0.8594, + "mean_token_accuracy": 0.7452760875225067, + "num_tokens": 39328003.0, + "step": 17000 + }, + { + "epoch": 0.15595489135417623, + "learning_rate": 0.00016881085541395433, + "loss": 0.8996, + "mean_token_accuracy": 0.7387515842914582, + "num_tokens": 39350914.0, + "step": 17010 + }, + { + "epoch": 0.15604657559365545, + "learning_rate": 0.00016879251856605852, + "loss": 0.8378, + "mean_token_accuracy": 0.7472789049148559, + "num_tokens": 39373506.0, + "step": 17020 + }, + { + "epoch": 0.15613825983313467, + "learning_rate": 0.00016877418171816266, + "loss": 0.8911, + "mean_token_accuracy": 0.7346392273902893, + "num_tokens": 39396798.0, + "step": 17030 + }, + { + "epoch": 0.15622994407261392, + "learning_rate": 0.0001687558448702668, + "loss": 0.8814, + "mean_token_accuracy": 0.7421307742595673, + "num_tokens": 39420214.0, + "step": 17040 + }, + { + "epoch": 0.15632162831209315, + "learning_rate": 0.00016873750802237096, + "loss": 0.8558, + "mean_token_accuracy": 0.7466699361801148, + "num_tokens": 39443028.0, + "step": 17050 + }, + { + "epoch": 0.1564133125515724, + "learning_rate": 0.0001687191711744751, + "loss": 0.8701, + "mean_token_accuracy": 0.7446559250354767, + "num_tokens": 39466517.0, + "step": 17060 + }, + { + "epoch": 0.15650499679105162, + "learning_rate": 0.00016870083432657927, + "loss": 0.9331, + "mean_token_accuracy": 0.7287180542945861, + "num_tokens": 39490932.0, + "step": 17070 + }, + { + "epoch": 0.15659668103053084, + "learning_rate": 0.00016868249747868343, + "loss": 0.8499, + "mean_token_accuracy": 0.7485387921333313, + "num_tokens": 39513849.0, + "step": 17080 + }, + { + "epoch": 0.1566883652700101, + "learning_rate": 0.00016866416063078757, + "loss": 0.8339, + "mean_token_accuracy": 0.7490086317062378, + "num_tokens": 39538317.0, + "step": 17090 + }, + { + "epoch": 0.15678004950948932, + "learning_rate": 0.00016864582378289174, + "loss": 0.8786, + "mean_token_accuracy": 0.7363821864128113, + "num_tokens": 39561298.0, + "step": 17100 + }, + { + "epoch": 0.15687173374896854, + "learning_rate": 0.00016862748693499588, + "loss": 0.873, + "mean_token_accuracy": 0.7386886358261109, + "num_tokens": 39583735.0, + "step": 17110 + }, + { + "epoch": 0.1569634179884478, + "learning_rate": 0.00016860915008710004, + "loss": 0.8882, + "mean_token_accuracy": 0.7353485643863678, + "num_tokens": 39606533.0, + "step": 17120 + }, + { + "epoch": 0.157055102227927, + "learning_rate": 0.00016859081323920418, + "loss": 0.9284, + "mean_token_accuracy": 0.7309687435626984, + "num_tokens": 39629313.0, + "step": 17130 + }, + { + "epoch": 0.15714678646740626, + "learning_rate": 0.00016857247639130834, + "loss": 0.8536, + "mean_token_accuracy": 0.7418226718902587, + "num_tokens": 39651940.0, + "step": 17140 + }, + { + "epoch": 0.15723847070688549, + "learning_rate": 0.0001685541395434125, + "loss": 0.8701, + "mean_token_accuracy": 0.7322404265403748, + "num_tokens": 39674810.0, + "step": 17150 + }, + { + "epoch": 0.1573301549463647, + "learning_rate": 0.00016853580269551665, + "loss": 0.9, + "mean_token_accuracy": 0.7297082722187043, + "num_tokens": 39698837.0, + "step": 17160 + }, + { + "epoch": 0.15742183918584396, + "learning_rate": 0.0001685174658476208, + "loss": 0.8814, + "mean_token_accuracy": 0.7342394649982452, + "num_tokens": 39721751.0, + "step": 17170 + }, + { + "epoch": 0.15751352342532318, + "learning_rate": 0.00016849912899972495, + "loss": 0.8597, + "mean_token_accuracy": 0.750165456533432, + "num_tokens": 39744338.0, + "step": 17180 + }, + { + "epoch": 0.15760520766480243, + "learning_rate": 0.0001684807921518291, + "loss": 0.8828, + "mean_token_accuracy": 0.736766242980957, + "num_tokens": 39768072.0, + "step": 17190 + }, + { + "epoch": 0.15769689190428166, + "learning_rate": 0.00016846245530393326, + "loss": 0.8625, + "mean_token_accuracy": 0.7397107303142547, + "num_tokens": 39791075.0, + "step": 17200 + }, + { + "epoch": 0.15778857614376088, + "learning_rate": 0.00016844411845603742, + "loss": 0.8736, + "mean_token_accuracy": 0.7415744304656983, + "num_tokens": 39814033.0, + "step": 17210 + }, + { + "epoch": 0.15788026038324013, + "learning_rate": 0.00016842578160814159, + "loss": 0.8237, + "mean_token_accuracy": 0.7556914150714874, + "num_tokens": 39838059.0, + "step": 17220 + }, + { + "epoch": 0.15797194462271935, + "learning_rate": 0.00016840744476024572, + "loss": 0.8579, + "mean_token_accuracy": 0.7471156656742096, + "num_tokens": 39861463.0, + "step": 17230 + }, + { + "epoch": 0.1580636288621986, + "learning_rate": 0.00016838910791234986, + "loss": 0.8737, + "mean_token_accuracy": 0.741560983657837, + "num_tokens": 39884397.0, + "step": 17240 + }, + { + "epoch": 0.15815531310167782, + "learning_rate": 0.00016837077106445403, + "loss": 0.8826, + "mean_token_accuracy": 0.738440752029419, + "num_tokens": 39907994.0, + "step": 17250 + }, + { + "epoch": 0.15824699734115705, + "learning_rate": 0.00016835243421655817, + "loss": 0.8741, + "mean_token_accuracy": 0.7396030426025391, + "num_tokens": 39930416.0, + "step": 17260 + }, + { + "epoch": 0.1583386815806363, + "learning_rate": 0.00016833409736866233, + "loss": 0.897, + "mean_token_accuracy": 0.7328746974468231, + "num_tokens": 39953552.0, + "step": 17270 + }, + { + "epoch": 0.15843036582011552, + "learning_rate": 0.0001683157605207665, + "loss": 0.8798, + "mean_token_accuracy": 0.7370184361934662, + "num_tokens": 39976687.0, + "step": 17280 + }, + { + "epoch": 0.15852205005959474, + "learning_rate": 0.00016829742367287064, + "loss": 0.8398, + "mean_token_accuracy": 0.7485899269580841, + "num_tokens": 40000792.0, + "step": 17290 + }, + { + "epoch": 0.158613734299074, + "learning_rate": 0.0001682790868249748, + "loss": 0.873, + "mean_token_accuracy": 0.7397284567356109, + "num_tokens": 40023544.0, + "step": 17300 + }, + { + "epoch": 0.15870541853855322, + "learning_rate": 0.00016826074997707894, + "loss": 0.8769, + "mean_token_accuracy": 0.7368694961071014, + "num_tokens": 40046236.0, + "step": 17310 + }, + { + "epoch": 0.15879710277803247, + "learning_rate": 0.0001682424131291831, + "loss": 0.8663, + "mean_token_accuracy": 0.7377434968948364, + "num_tokens": 40069467.0, + "step": 17320 + }, + { + "epoch": 0.1588887870175117, + "learning_rate": 0.00016822407628128724, + "loss": 0.9228, + "mean_token_accuracy": 0.733688759803772, + "num_tokens": 40092677.0, + "step": 17330 + }, + { + "epoch": 0.1589804712569909, + "learning_rate": 0.0001682057394333914, + "loss": 0.8815, + "mean_token_accuracy": 0.7415893852710724, + "num_tokens": 40115888.0, + "step": 17340 + }, + { + "epoch": 0.15907215549647016, + "learning_rate": 0.00016818740258549557, + "loss": 0.8612, + "mean_token_accuracy": 0.7410473346710205, + "num_tokens": 40138364.0, + "step": 17350 + }, + { + "epoch": 0.1591638397359494, + "learning_rate": 0.0001681690657375997, + "loss": 0.8853, + "mean_token_accuracy": 0.7327299773693084, + "num_tokens": 40161415.0, + "step": 17360 + }, + { + "epoch": 0.15925552397542864, + "learning_rate": 0.00016815072888970388, + "loss": 0.9074, + "mean_token_accuracy": 0.7273565292358398, + "num_tokens": 40184518.0, + "step": 17370 + }, + { + "epoch": 0.15934720821490786, + "learning_rate": 0.00016813239204180802, + "loss": 0.8358, + "mean_token_accuracy": 0.748268336057663, + "num_tokens": 40208537.0, + "step": 17380 + }, + { + "epoch": 0.15943889245438708, + "learning_rate": 0.00016811405519391215, + "loss": 0.8466, + "mean_token_accuracy": 0.7444461345672607, + "num_tokens": 40231126.0, + "step": 17390 + }, + { + "epoch": 0.15953057669386633, + "learning_rate": 0.00016809571834601632, + "loss": 0.8726, + "mean_token_accuracy": 0.7356184244155883, + "num_tokens": 40253514.0, + "step": 17400 + }, + { + "epoch": 0.15962226093334556, + "learning_rate": 0.00016807738149812049, + "loss": 0.8935, + "mean_token_accuracy": 0.7391709446907043, + "num_tokens": 40276077.0, + "step": 17410 + }, + { + "epoch": 0.15971394517282478, + "learning_rate": 0.00016805904465022465, + "loss": 0.8631, + "mean_token_accuracy": 0.7399099051952363, + "num_tokens": 40299076.0, + "step": 17420 + }, + { + "epoch": 0.15980562941230403, + "learning_rate": 0.0001680407078023288, + "loss": 0.8573, + "mean_token_accuracy": 0.7385023057460784, + "num_tokens": 40321935.0, + "step": 17430 + }, + { + "epoch": 0.15989731365178325, + "learning_rate": 0.00016802237095443293, + "loss": 0.8413, + "mean_token_accuracy": 0.7480131924152374, + "num_tokens": 40344781.0, + "step": 17440 + }, + { + "epoch": 0.1599889978912625, + "learning_rate": 0.0001680040341065371, + "loss": 0.862, + "mean_token_accuracy": 0.7477836430072784, + "num_tokens": 40368409.0, + "step": 17450 + }, + { + "epoch": 0.16008068213074172, + "learning_rate": 0.00016798569725864123, + "loss": 0.8624, + "mean_token_accuracy": 0.7396600663661956, + "num_tokens": 40391838.0, + "step": 17460 + }, + { + "epoch": 0.16017236637022095, + "learning_rate": 0.00016796736041074542, + "loss": 0.8757, + "mean_token_accuracy": 0.744785076379776, + "num_tokens": 40414894.0, + "step": 17470 + }, + { + "epoch": 0.1602640506097002, + "learning_rate": 0.00016794902356284956, + "loss": 0.8487, + "mean_token_accuracy": 0.74610915184021, + "num_tokens": 40437014.0, + "step": 17480 + }, + { + "epoch": 0.16035573484917942, + "learning_rate": 0.0001679306867149537, + "loss": 0.8606, + "mean_token_accuracy": 0.7441764593124389, + "num_tokens": 40459884.0, + "step": 17490 + }, + { + "epoch": 0.16044741908865867, + "learning_rate": 0.00016791234986705787, + "loss": 0.8633, + "mean_token_accuracy": 0.7488744735717774, + "num_tokens": 40483174.0, + "step": 17500 + }, + { + "epoch": 0.1605391033281379, + "learning_rate": 0.000167894013019162, + "loss": 0.8736, + "mean_token_accuracy": 0.7425401151180268, + "num_tokens": 40505775.0, + "step": 17510 + }, + { + "epoch": 0.16063078756761712, + "learning_rate": 0.00016787567617126617, + "loss": 0.8412, + "mean_token_accuracy": 0.7526976048946381, + "num_tokens": 40528854.0, + "step": 17520 + }, + { + "epoch": 0.16072247180709637, + "learning_rate": 0.0001678573393233703, + "loss": 0.8519, + "mean_token_accuracy": 0.7444073617458343, + "num_tokens": 40552442.0, + "step": 17530 + }, + { + "epoch": 0.1608141560465756, + "learning_rate": 0.00016783900247547447, + "loss": 0.8215, + "mean_token_accuracy": 0.7446524620056152, + "num_tokens": 40575262.0, + "step": 17540 + }, + { + "epoch": 0.16090584028605484, + "learning_rate": 0.00016782066562757864, + "loss": 0.9047, + "mean_token_accuracy": 0.7284642696380615, + "num_tokens": 40598247.0, + "step": 17550 + }, + { + "epoch": 0.16099752452553406, + "learning_rate": 0.00016780232877968278, + "loss": 0.8789, + "mean_token_accuracy": 0.7382528483867645, + "num_tokens": 40621385.0, + "step": 17560 + }, + { + "epoch": 0.1610892087650133, + "learning_rate": 0.00016778399193178694, + "loss": 0.8442, + "mean_token_accuracy": 0.7507353901863099, + "num_tokens": 40644241.0, + "step": 17570 + }, + { + "epoch": 0.16118089300449254, + "learning_rate": 0.00016776565508389108, + "loss": 0.8523, + "mean_token_accuracy": 0.7480726540088654, + "num_tokens": 40667355.0, + "step": 17580 + }, + { + "epoch": 0.16127257724397176, + "learning_rate": 0.00016774731823599522, + "loss": 0.9176, + "mean_token_accuracy": 0.7309023559093475, + "num_tokens": 40690723.0, + "step": 17590 + }, + { + "epoch": 0.16136426148345098, + "learning_rate": 0.0001677289813880994, + "loss": 0.8678, + "mean_token_accuracy": 0.7350658476352692, + "num_tokens": 40713685.0, + "step": 17600 + }, + { + "epoch": 0.16145594572293023, + "learning_rate": 0.00016771064454020355, + "loss": 0.883, + "mean_token_accuracy": 0.7347937643527984, + "num_tokens": 40737807.0, + "step": 17610 + }, + { + "epoch": 0.16154762996240946, + "learning_rate": 0.00016769230769230772, + "loss": 0.8602, + "mean_token_accuracy": 0.7383953213691712, + "num_tokens": 40760836.0, + "step": 17620 + }, + { + "epoch": 0.1616393142018887, + "learning_rate": 0.00016767397084441185, + "loss": 0.8989, + "mean_token_accuracy": 0.7323030471801758, + "num_tokens": 40783731.0, + "step": 17630 + }, + { + "epoch": 0.16173099844136793, + "learning_rate": 0.000167655633996516, + "loss": 0.8462, + "mean_token_accuracy": 0.7501704514026641, + "num_tokens": 40806410.0, + "step": 17640 + }, + { + "epoch": 0.16182268268084715, + "learning_rate": 0.00016763729714862016, + "loss": 0.8738, + "mean_token_accuracy": 0.7390379190444947, + "num_tokens": 40830395.0, + "step": 17650 + }, + { + "epoch": 0.1619143669203264, + "learning_rate": 0.0001676189603007243, + "loss": 0.8263, + "mean_token_accuracy": 0.7556713819503784, + "num_tokens": 40853533.0, + "step": 17660 + }, + { + "epoch": 0.16200605115980563, + "learning_rate": 0.0001676006234528285, + "loss": 0.8509, + "mean_token_accuracy": 0.7434868693351746, + "num_tokens": 40877452.0, + "step": 17670 + }, + { + "epoch": 0.16209773539928488, + "learning_rate": 0.00016758228660493263, + "loss": 0.8279, + "mean_token_accuracy": 0.7525975346565247, + "num_tokens": 40900679.0, + "step": 17680 + }, + { + "epoch": 0.1621894196387641, + "learning_rate": 0.00016756394975703676, + "loss": 0.8429, + "mean_token_accuracy": 0.7483399212360382, + "num_tokens": 40923667.0, + "step": 17690 + }, + { + "epoch": 0.16228110387824332, + "learning_rate": 0.00016754561290914093, + "loss": 0.8558, + "mean_token_accuracy": 0.7391563951969147, + "num_tokens": 40946901.0, + "step": 17700 + }, + { + "epoch": 0.16237278811772257, + "learning_rate": 0.00016752727606124507, + "loss": 0.8968, + "mean_token_accuracy": 0.7328025579452515, + "num_tokens": 40970559.0, + "step": 17710 + }, + { + "epoch": 0.1624644723572018, + "learning_rate": 0.00016750893921334923, + "loss": 0.8767, + "mean_token_accuracy": 0.7393238782882691, + "num_tokens": 40994083.0, + "step": 17720 + }, + { + "epoch": 0.16255615659668102, + "learning_rate": 0.0001674906023654534, + "loss": 0.9021, + "mean_token_accuracy": 0.7304047882556916, + "num_tokens": 41017443.0, + "step": 17730 + }, + { + "epoch": 0.16264784083616027, + "learning_rate": 0.00016747226551755754, + "loss": 0.8565, + "mean_token_accuracy": 0.7497427701950073, + "num_tokens": 41040736.0, + "step": 17740 + }, + { + "epoch": 0.1627395250756395, + "learning_rate": 0.0001674539286696617, + "loss": 0.8527, + "mean_token_accuracy": 0.7382766842842102, + "num_tokens": 41063711.0, + "step": 17750 + }, + { + "epoch": 0.16283120931511874, + "learning_rate": 0.00016743559182176584, + "loss": 0.8953, + "mean_token_accuracy": 0.7397700190544129, + "num_tokens": 41086464.0, + "step": 17760 + }, + { + "epoch": 0.16292289355459796, + "learning_rate": 0.00016741725497387, + "loss": 0.8306, + "mean_token_accuracy": 0.7546618223190308, + "num_tokens": 41110300.0, + "step": 17770 + }, + { + "epoch": 0.1630145777940772, + "learning_rate": 0.00016739891812597415, + "loss": 0.9008, + "mean_token_accuracy": 0.7381853759288788, + "num_tokens": 41133380.0, + "step": 17780 + }, + { + "epoch": 0.16310626203355644, + "learning_rate": 0.00016738058127807828, + "loss": 0.8659, + "mean_token_accuracy": 0.7472920775413513, + "num_tokens": 41157213.0, + "step": 17790 + }, + { + "epoch": 0.16319794627303566, + "learning_rate": 0.00016736224443018248, + "loss": 0.8839, + "mean_token_accuracy": 0.7403927803039551, + "num_tokens": 41180107.0, + "step": 17800 + }, + { + "epoch": 0.1632896305125149, + "learning_rate": 0.00016734390758228661, + "loss": 0.8435, + "mean_token_accuracy": 0.7507363438606263, + "num_tokens": 41203089.0, + "step": 17810 + }, + { + "epoch": 0.16338131475199413, + "learning_rate": 0.00016732557073439078, + "loss": 0.8605, + "mean_token_accuracy": 0.7463716804981232, + "num_tokens": 41226464.0, + "step": 17820 + }, + { + "epoch": 0.16347299899147336, + "learning_rate": 0.00016730723388649492, + "loss": 0.8599, + "mean_token_accuracy": 0.7399094104766846, + "num_tokens": 41249910.0, + "step": 17830 + }, + { + "epoch": 0.1635646832309526, + "learning_rate": 0.00016728889703859906, + "loss": 0.8544, + "mean_token_accuracy": 0.744236272573471, + "num_tokens": 41273470.0, + "step": 17840 + }, + { + "epoch": 0.16365636747043183, + "learning_rate": 0.00016727056019070322, + "loss": 0.88, + "mean_token_accuracy": 0.7369423568248749, + "num_tokens": 41297073.0, + "step": 17850 + }, + { + "epoch": 0.16374805170991108, + "learning_rate": 0.0001672522233428074, + "loss": 0.8834, + "mean_token_accuracy": 0.7375329375267029, + "num_tokens": 41319820.0, + "step": 17860 + }, + { + "epoch": 0.1638397359493903, + "learning_rate": 0.00016723388649491155, + "loss": 0.8611, + "mean_token_accuracy": 0.7408622324466705, + "num_tokens": 41343302.0, + "step": 17870 + }, + { + "epoch": 0.16393142018886953, + "learning_rate": 0.0001672155496470157, + "loss": 0.8906, + "mean_token_accuracy": 0.7352072417736053, + "num_tokens": 41366200.0, + "step": 17880 + }, + { + "epoch": 0.16402310442834878, + "learning_rate": 0.00016719721279911983, + "loss": 0.8648, + "mean_token_accuracy": 0.7434074938297272, + "num_tokens": 41389922.0, + "step": 17890 + }, + { + "epoch": 0.164114788667828, + "learning_rate": 0.000167178875951224, + "loss": 0.872, + "mean_token_accuracy": 0.7438861548900604, + "num_tokens": 41412672.0, + "step": 17900 + }, + { + "epoch": 0.16420647290730722, + "learning_rate": 0.00016716053910332813, + "loss": 0.8794, + "mean_token_accuracy": 0.7390958905220032, + "num_tokens": 41435521.0, + "step": 17910 + }, + { + "epoch": 0.16429815714678647, + "learning_rate": 0.0001671422022554323, + "loss": 0.8893, + "mean_token_accuracy": 0.7348230957984925, + "num_tokens": 41458368.0, + "step": 17920 + }, + { + "epoch": 0.1643898413862657, + "learning_rate": 0.00016712386540753646, + "loss": 0.888, + "mean_token_accuracy": 0.7326744616031646, + "num_tokens": 41481181.0, + "step": 17930 + }, + { + "epoch": 0.16448152562574495, + "learning_rate": 0.0001671055285596406, + "loss": 0.8587, + "mean_token_accuracy": 0.7451447486877442, + "num_tokens": 41504551.0, + "step": 17940 + }, + { + "epoch": 0.16457320986522417, + "learning_rate": 0.00016708719171174477, + "loss": 0.8908, + "mean_token_accuracy": 0.7369565606117249, + "num_tokens": 41527906.0, + "step": 17950 + }, + { + "epoch": 0.1646648941047034, + "learning_rate": 0.0001670688548638489, + "loss": 0.8823, + "mean_token_accuracy": 0.7395092904567718, + "num_tokens": 41550696.0, + "step": 17960 + }, + { + "epoch": 0.16475657834418264, + "learning_rate": 0.00016705051801595307, + "loss": 0.8643, + "mean_token_accuracy": 0.7378550350666047, + "num_tokens": 41573912.0, + "step": 17970 + }, + { + "epoch": 0.16484826258366186, + "learning_rate": 0.0001670321811680572, + "loss": 0.8576, + "mean_token_accuracy": 0.7506725192070007, + "num_tokens": 41596736.0, + "step": 17980 + }, + { + "epoch": 0.16493994682314111, + "learning_rate": 0.00016701384432016135, + "loss": 0.8617, + "mean_token_accuracy": 0.745305860042572, + "num_tokens": 41620143.0, + "step": 17990 + }, + { + "epoch": 0.16503163106262034, + "learning_rate": 0.00016699550747226554, + "loss": 0.8615, + "mean_token_accuracy": 0.7396979570388794, + "num_tokens": 41642888.0, + "step": 18000 + }, + { + "epoch": 0.16512331530209956, + "learning_rate": 0.00016697717062436968, + "loss": 0.8763, + "mean_token_accuracy": 0.7461963713169097, + "num_tokens": 41666072.0, + "step": 18010 + }, + { + "epoch": 0.1652149995415788, + "learning_rate": 0.00016695883377647384, + "loss": 0.8467, + "mean_token_accuracy": 0.7509789228439331, + "num_tokens": 41689047.0, + "step": 18020 + }, + { + "epoch": 0.16530668378105803, + "learning_rate": 0.00016694049692857798, + "loss": 0.8528, + "mean_token_accuracy": 0.7466614663600921, + "num_tokens": 41711812.0, + "step": 18030 + }, + { + "epoch": 0.16539836802053726, + "learning_rate": 0.00016692216008068212, + "loss": 0.8595, + "mean_token_accuracy": 0.7391000628471375, + "num_tokens": 41734735.0, + "step": 18040 + }, + { + "epoch": 0.1654900522600165, + "learning_rate": 0.00016690382323278629, + "loss": 0.8296, + "mean_token_accuracy": 0.7464460790157318, + "num_tokens": 41758220.0, + "step": 18050 + }, + { + "epoch": 0.16558173649949573, + "learning_rate": 0.00016688548638489045, + "loss": 0.8485, + "mean_token_accuracy": 0.7436749279499054, + "num_tokens": 41780829.0, + "step": 18060 + }, + { + "epoch": 0.16567342073897498, + "learning_rate": 0.00016686714953699462, + "loss": 0.9127, + "mean_token_accuracy": 0.7377270340919495, + "num_tokens": 41804318.0, + "step": 18070 + }, + { + "epoch": 0.1657651049784542, + "learning_rate": 0.00016684881268909876, + "loss": 0.8736, + "mean_token_accuracy": 0.7382775187492371, + "num_tokens": 41827759.0, + "step": 18080 + }, + { + "epoch": 0.16585678921793343, + "learning_rate": 0.0001668304758412029, + "loss": 0.8922, + "mean_token_accuracy": 0.73809455037117, + "num_tokens": 41851849.0, + "step": 18090 + }, + { + "epoch": 0.16594847345741268, + "learning_rate": 0.00016681213899330706, + "loss": 0.8676, + "mean_token_accuracy": 0.7345297038555145, + "num_tokens": 41875334.0, + "step": 18100 + }, + { + "epoch": 0.1660401576968919, + "learning_rate": 0.0001667938021454112, + "loss": 0.8805, + "mean_token_accuracy": 0.7380764663219452, + "num_tokens": 41898370.0, + "step": 18110 + }, + { + "epoch": 0.16613184193637115, + "learning_rate": 0.00016677546529751536, + "loss": 0.8565, + "mean_token_accuracy": 0.7484489917755127, + "num_tokens": 41920790.0, + "step": 18120 + }, + { + "epoch": 0.16622352617585037, + "learning_rate": 0.00016675712844961953, + "loss": 0.8562, + "mean_token_accuracy": 0.7416860640048981, + "num_tokens": 41943929.0, + "step": 18130 + }, + { + "epoch": 0.1663152104153296, + "learning_rate": 0.00016673879160172367, + "loss": 0.8774, + "mean_token_accuracy": 0.7420123457908631, + "num_tokens": 41967118.0, + "step": 18140 + }, + { + "epoch": 0.16640689465480885, + "learning_rate": 0.00016672045475382783, + "loss": 0.8264, + "mean_token_accuracy": 0.7512724161148071, + "num_tokens": 41990403.0, + "step": 18150 + }, + { + "epoch": 0.16649857889428807, + "learning_rate": 0.00016670211790593197, + "loss": 0.8437, + "mean_token_accuracy": 0.7459653854370117, + "num_tokens": 42013721.0, + "step": 18160 + }, + { + "epoch": 0.16659026313376732, + "learning_rate": 0.00016668378105803614, + "loss": 0.8881, + "mean_token_accuracy": 0.7412309527397156, + "num_tokens": 42037341.0, + "step": 18170 + }, + { + "epoch": 0.16668194737324654, + "learning_rate": 0.00016666544421014027, + "loss": 0.8493, + "mean_token_accuracy": 0.7402162849903107, + "num_tokens": 42060495.0, + "step": 18180 + }, + { + "epoch": 0.16677363161272576, + "learning_rate": 0.00016664710736224444, + "loss": 0.8624, + "mean_token_accuracy": 0.7407247722148895, + "num_tokens": 42084480.0, + "step": 18190 + }, + { + "epoch": 0.16686531585220502, + "learning_rate": 0.0001666287705143486, + "loss": 0.8826, + "mean_token_accuracy": 0.7436165332794189, + "num_tokens": 42107356.0, + "step": 18200 + }, + { + "epoch": 0.16695700009168424, + "learning_rate": 0.00016661043366645274, + "loss": 0.8558, + "mean_token_accuracy": 0.7454732954502106, + "num_tokens": 42131261.0, + "step": 18210 + }, + { + "epoch": 0.16704868433116346, + "learning_rate": 0.0001665920968185569, + "loss": 0.8923, + "mean_token_accuracy": 0.7352973461151123, + "num_tokens": 42154529.0, + "step": 18220 + }, + { + "epoch": 0.1671403685706427, + "learning_rate": 0.00016657375997066105, + "loss": 0.867, + "mean_token_accuracy": 0.7395649433135987, + "num_tokens": 42177293.0, + "step": 18230 + }, + { + "epoch": 0.16723205281012193, + "learning_rate": 0.00016655542312276519, + "loss": 0.8969, + "mean_token_accuracy": 0.7318514168262482, + "num_tokens": 42201043.0, + "step": 18240 + }, + { + "epoch": 0.16732373704960118, + "learning_rate": 0.00016653708627486935, + "loss": 0.862, + "mean_token_accuracy": 0.7404728889465332, + "num_tokens": 42224080.0, + "step": 18250 + }, + { + "epoch": 0.1674154212890804, + "learning_rate": 0.00016651874942697352, + "loss": 0.901, + "mean_token_accuracy": 0.7297580242156982, + "num_tokens": 42246844.0, + "step": 18260 + }, + { + "epoch": 0.16750710552855963, + "learning_rate": 0.00016650041257907768, + "loss": 0.886, + "mean_token_accuracy": 0.737334668636322, + "num_tokens": 42270168.0, + "step": 18270 + }, + { + "epoch": 0.16759878976803888, + "learning_rate": 0.00016648207573118182, + "loss": 0.8799, + "mean_token_accuracy": 0.745305997133255, + "num_tokens": 42293055.0, + "step": 18280 + }, + { + "epoch": 0.1676904740075181, + "learning_rate": 0.00016646373888328596, + "loss": 0.8566, + "mean_token_accuracy": 0.7517912030220032, + "num_tokens": 42317077.0, + "step": 18290 + }, + { + "epoch": 0.16778215824699735, + "learning_rate": 0.00016644540203539012, + "loss": 0.8818, + "mean_token_accuracy": 0.739583021402359, + "num_tokens": 42340461.0, + "step": 18300 + }, + { + "epoch": 0.16787384248647658, + "learning_rate": 0.00016642706518749426, + "loss": 0.8967, + "mean_token_accuracy": 0.7339466094970704, + "num_tokens": 42363235.0, + "step": 18310 + }, + { + "epoch": 0.1679655267259558, + "learning_rate": 0.00016640872833959845, + "loss": 0.8746, + "mean_token_accuracy": 0.7352726817131042, + "num_tokens": 42385965.0, + "step": 18320 + }, + { + "epoch": 0.16805721096543505, + "learning_rate": 0.0001663903914917026, + "loss": 0.8375, + "mean_token_accuracy": 0.747681075334549, + "num_tokens": 42409057.0, + "step": 18330 + }, + { + "epoch": 0.16814889520491427, + "learning_rate": 0.00016637205464380673, + "loss": 0.8451, + "mean_token_accuracy": 0.7485225677490235, + "num_tokens": 42432307.0, + "step": 18340 + }, + { + "epoch": 0.1682405794443935, + "learning_rate": 0.0001663537177959109, + "loss": 0.883, + "mean_token_accuracy": 0.7471256136894227, + "num_tokens": 42455741.0, + "step": 18350 + }, + { + "epoch": 0.16833226368387275, + "learning_rate": 0.00016633538094801503, + "loss": 0.8828, + "mean_token_accuracy": 0.7374133229255676, + "num_tokens": 42479199.0, + "step": 18360 + }, + { + "epoch": 0.16842394792335197, + "learning_rate": 0.0001663170441001192, + "loss": 0.8592, + "mean_token_accuracy": 0.7457978844642639, + "num_tokens": 42502926.0, + "step": 18370 + }, + { + "epoch": 0.16851563216283122, + "learning_rate": 0.00016629870725222334, + "loss": 0.8568, + "mean_token_accuracy": 0.7415787398815155, + "num_tokens": 42525572.0, + "step": 18380 + }, + { + "epoch": 0.16860731640231044, + "learning_rate": 0.0001662803704043275, + "loss": 0.8406, + "mean_token_accuracy": 0.7437069296836853, + "num_tokens": 42548672.0, + "step": 18390 + }, + { + "epoch": 0.16869900064178966, + "learning_rate": 0.00016626203355643167, + "loss": 0.8605, + "mean_token_accuracy": 0.7456466615200043, + "num_tokens": 42571442.0, + "step": 18400 + }, + { + "epoch": 0.16879068488126892, + "learning_rate": 0.0001662436967085358, + "loss": 0.8847, + "mean_token_accuracy": 0.7428866684436798, + "num_tokens": 42595266.0, + "step": 18410 + }, + { + "epoch": 0.16888236912074814, + "learning_rate": 0.00016622535986063997, + "loss": 0.8631, + "mean_token_accuracy": 0.7364484310150147, + "num_tokens": 42618549.0, + "step": 18420 + }, + { + "epoch": 0.1689740533602274, + "learning_rate": 0.0001662070230127441, + "loss": 0.8511, + "mean_token_accuracy": 0.7413220882415772, + "num_tokens": 42641416.0, + "step": 18430 + }, + { + "epoch": 0.1690657375997066, + "learning_rate": 0.00016618868616484825, + "loss": 0.8551, + "mean_token_accuracy": 0.7441992104053498, + "num_tokens": 42664003.0, + "step": 18440 + }, + { + "epoch": 0.16915742183918583, + "learning_rate": 0.00016617034931695244, + "loss": 0.8622, + "mean_token_accuracy": 0.744612205028534, + "num_tokens": 42686954.0, + "step": 18450 + }, + { + "epoch": 0.16924910607866508, + "learning_rate": 0.00016615201246905658, + "loss": 0.8922, + "mean_token_accuracy": 0.7364725351333619, + "num_tokens": 42710534.0, + "step": 18460 + }, + { + "epoch": 0.1693407903181443, + "learning_rate": 0.00016613367562116075, + "loss": 0.8191, + "mean_token_accuracy": 0.7570809066295624, + "num_tokens": 42733186.0, + "step": 18470 + }, + { + "epoch": 0.16943247455762356, + "learning_rate": 0.00016611533877326488, + "loss": 0.8987, + "mean_token_accuracy": 0.7353633105754852, + "num_tokens": 42756712.0, + "step": 18480 + }, + { + "epoch": 0.16952415879710278, + "learning_rate": 0.00016609700192536902, + "loss": 0.8761, + "mean_token_accuracy": 0.734033203125, + "num_tokens": 42781296.0, + "step": 18490 + }, + { + "epoch": 0.169615843036582, + "learning_rate": 0.0001660786650774732, + "loss": 0.8536, + "mean_token_accuracy": 0.7415765881538391, + "num_tokens": 42804319.0, + "step": 18500 + }, + { + "epoch": 0.16970752727606125, + "learning_rate": 0.00016606032822957733, + "loss": 0.8375, + "mean_token_accuracy": 0.7495999097824096, + "num_tokens": 42827149.0, + "step": 18510 + }, + { + "epoch": 0.16979921151554048, + "learning_rate": 0.00016604199138168152, + "loss": 0.8976, + "mean_token_accuracy": 0.7378803551197052, + "num_tokens": 42850539.0, + "step": 18520 + }, + { + "epoch": 0.1698908957550197, + "learning_rate": 0.00016602365453378566, + "loss": 0.8484, + "mean_token_accuracy": 0.7473590672016144, + "num_tokens": 42873882.0, + "step": 18530 + }, + { + "epoch": 0.16998257999449895, + "learning_rate": 0.0001660053176858898, + "loss": 0.8542, + "mean_token_accuracy": 0.7415569961071015, + "num_tokens": 42897100.0, + "step": 18540 + }, + { + "epoch": 0.17007426423397817, + "learning_rate": 0.00016598698083799396, + "loss": 0.8384, + "mean_token_accuracy": 0.7476524829864502, + "num_tokens": 42920015.0, + "step": 18550 + }, + { + "epoch": 0.17016594847345742, + "learning_rate": 0.0001659686439900981, + "loss": 0.8643, + "mean_token_accuracy": 0.7376882374286652, + "num_tokens": 42943162.0, + "step": 18560 + }, + { + "epoch": 0.17025763271293665, + "learning_rate": 0.00016595030714220226, + "loss": 0.8767, + "mean_token_accuracy": 0.7456963539123536, + "num_tokens": 42966756.0, + "step": 18570 + }, + { + "epoch": 0.17034931695241587, + "learning_rate": 0.00016593197029430643, + "loss": 0.8904, + "mean_token_accuracy": 0.745152348279953, + "num_tokens": 42989343.0, + "step": 18580 + }, + { + "epoch": 0.17044100119189512, + "learning_rate": 0.00016591363344641057, + "loss": 0.8785, + "mean_token_accuracy": 0.7373985052108765, + "num_tokens": 43012254.0, + "step": 18590 + }, + { + "epoch": 0.17053268543137434, + "learning_rate": 0.00016589529659851473, + "loss": 0.8575, + "mean_token_accuracy": 0.746576726436615, + "num_tokens": 43035654.0, + "step": 18600 + }, + { + "epoch": 0.1706243696708536, + "learning_rate": 0.00016587695975061887, + "loss": 0.8701, + "mean_token_accuracy": 0.7436378777027131, + "num_tokens": 43058202.0, + "step": 18610 + }, + { + "epoch": 0.17071605391033282, + "learning_rate": 0.00016585862290272304, + "loss": 0.8553, + "mean_token_accuracy": 0.7430861413478851, + "num_tokens": 43081274.0, + "step": 18620 + }, + { + "epoch": 0.17080773814981204, + "learning_rate": 0.00016584028605482718, + "loss": 0.8635, + "mean_token_accuracy": 0.7420690774917602, + "num_tokens": 43104564.0, + "step": 18630 + }, + { + "epoch": 0.1708994223892913, + "learning_rate": 0.00016582194920693131, + "loss": 0.8657, + "mean_token_accuracy": 0.7420691609382629, + "num_tokens": 43127185.0, + "step": 18640 + }, + { + "epoch": 0.1709911066287705, + "learning_rate": 0.0001658036123590355, + "loss": 0.8493, + "mean_token_accuracy": 0.7503941476345062, + "num_tokens": 43149937.0, + "step": 18650 + }, + { + "epoch": 0.17108279086824973, + "learning_rate": 0.00016578527551113964, + "loss": 0.8751, + "mean_token_accuracy": 0.7426930785179138, + "num_tokens": 43173374.0, + "step": 18660 + }, + { + "epoch": 0.17117447510772899, + "learning_rate": 0.0001657669386632438, + "loss": 0.8475, + "mean_token_accuracy": 0.7485217332839966, + "num_tokens": 43196583.0, + "step": 18670 + }, + { + "epoch": 0.1712661593472082, + "learning_rate": 0.00016574860181534795, + "loss": 0.8932, + "mean_token_accuracy": 0.7311478614807129, + "num_tokens": 43219366.0, + "step": 18680 + }, + { + "epoch": 0.17135784358668746, + "learning_rate": 0.0001657302649674521, + "loss": 0.8403, + "mean_token_accuracy": 0.7468105971813201, + "num_tokens": 43242694.0, + "step": 18690 + }, + { + "epoch": 0.17144952782616668, + "learning_rate": 0.00016571192811955625, + "loss": 0.8767, + "mean_token_accuracy": 0.7375354588031768, + "num_tokens": 43265614.0, + "step": 18700 + }, + { + "epoch": 0.1715412120656459, + "learning_rate": 0.00016569359127166042, + "loss": 0.8935, + "mean_token_accuracy": 0.7387665510177612, + "num_tokens": 43289693.0, + "step": 18710 + }, + { + "epoch": 0.17163289630512515, + "learning_rate": 0.00016567525442376458, + "loss": 0.901, + "mean_token_accuracy": 0.7406913757324218, + "num_tokens": 43312562.0, + "step": 18720 + }, + { + "epoch": 0.17172458054460438, + "learning_rate": 0.00016565691757586872, + "loss": 0.8671, + "mean_token_accuracy": 0.7439317822456359, + "num_tokens": 43336606.0, + "step": 18730 + }, + { + "epoch": 0.17181626478408363, + "learning_rate": 0.00016563858072797286, + "loss": 0.8827, + "mean_token_accuracy": 0.745622968673706, + "num_tokens": 43359267.0, + "step": 18740 + }, + { + "epoch": 0.17190794902356285, + "learning_rate": 0.00016562024388007703, + "loss": 0.8614, + "mean_token_accuracy": 0.7413673400878906, + "num_tokens": 43381707.0, + "step": 18750 + }, + { + "epoch": 0.17199963326304207, + "learning_rate": 0.00016560190703218116, + "loss": 0.8815, + "mean_token_accuracy": 0.7391298234462738, + "num_tokens": 43404642.0, + "step": 18760 + }, + { + "epoch": 0.17209131750252132, + "learning_rate": 0.00016558357018428533, + "loss": 0.8286, + "mean_token_accuracy": 0.749553632736206, + "num_tokens": 43427570.0, + "step": 18770 + }, + { + "epoch": 0.17218300174200055, + "learning_rate": 0.0001655652333363895, + "loss": 0.8664, + "mean_token_accuracy": 0.7399058640003204, + "num_tokens": 43450522.0, + "step": 18780 + }, + { + "epoch": 0.1722746859814798, + "learning_rate": 0.00016554689648849363, + "loss": 0.8819, + "mean_token_accuracy": 0.7367096960544586, + "num_tokens": 43474693.0, + "step": 18790 + }, + { + "epoch": 0.17236637022095902, + "learning_rate": 0.0001655285596405978, + "loss": 0.8765, + "mean_token_accuracy": 0.745033347606659, + "num_tokens": 43497467.0, + "step": 18800 + }, + { + "epoch": 0.17245805446043824, + "learning_rate": 0.00016551022279270194, + "loss": 0.8341, + "mean_token_accuracy": 0.7419469773769378, + "num_tokens": 43520604.0, + "step": 18810 + }, + { + "epoch": 0.1725497386999175, + "learning_rate": 0.0001654918859448061, + "loss": 0.8581, + "mean_token_accuracy": 0.7410984992980957, + "num_tokens": 43543484.0, + "step": 18820 + }, + { + "epoch": 0.17264142293939672, + "learning_rate": 0.00016547354909691024, + "loss": 0.8622, + "mean_token_accuracy": 0.7435258150100708, + "num_tokens": 43566599.0, + "step": 18830 + }, + { + "epoch": 0.17273310717887594, + "learning_rate": 0.0001654552122490144, + "loss": 0.8831, + "mean_token_accuracy": 0.7390017509460449, + "num_tokens": 43589880.0, + "step": 18840 + }, + { + "epoch": 0.1728247914183552, + "learning_rate": 0.00016543687540111857, + "loss": 0.8222, + "mean_token_accuracy": 0.7479391753673553, + "num_tokens": 43613401.0, + "step": 18850 + }, + { + "epoch": 0.1729164756578344, + "learning_rate": 0.0001654185385532227, + "loss": 0.8804, + "mean_token_accuracy": 0.7409896969795227, + "num_tokens": 43636740.0, + "step": 18860 + }, + { + "epoch": 0.17300815989731366, + "learning_rate": 0.00016540020170532687, + "loss": 0.9086, + "mean_token_accuracy": 0.7395063579082489, + "num_tokens": 43659994.0, + "step": 18870 + }, + { + "epoch": 0.17309984413679289, + "learning_rate": 0.000165381864857431, + "loss": 0.8353, + "mean_token_accuracy": 0.7457105338573455, + "num_tokens": 43683450.0, + "step": 18880 + }, + { + "epoch": 0.1731915283762721, + "learning_rate": 0.00016536352800953515, + "loss": 0.8514, + "mean_token_accuracy": 0.7494057893753052, + "num_tokens": 43706137.0, + "step": 18890 + }, + { + "epoch": 0.17328321261575136, + "learning_rate": 0.00016534519116163932, + "loss": 0.8835, + "mean_token_accuracy": 0.7364172041416168, + "num_tokens": 43729224.0, + "step": 18900 + }, + { + "epoch": 0.17337489685523058, + "learning_rate": 0.00016532685431374348, + "loss": 0.8394, + "mean_token_accuracy": 0.7496098220348358, + "num_tokens": 43751460.0, + "step": 18910 + }, + { + "epoch": 0.17346658109470983, + "learning_rate": 0.00016530851746584765, + "loss": 0.8153, + "mean_token_accuracy": 0.7558809697628022, + "num_tokens": 43774059.0, + "step": 18920 + }, + { + "epoch": 0.17355826533418905, + "learning_rate": 0.00016529018061795179, + "loss": 0.882, + "mean_token_accuracy": 0.7378742516040802, + "num_tokens": 43797321.0, + "step": 18930 + }, + { + "epoch": 0.17364994957366828, + "learning_rate": 0.00016527184377005592, + "loss": 0.8832, + "mean_token_accuracy": 0.7422385215759277, + "num_tokens": 43820304.0, + "step": 18940 + }, + { + "epoch": 0.17374163381314753, + "learning_rate": 0.0001652535069221601, + "loss": 0.8728, + "mean_token_accuracy": 0.7387481093406677, + "num_tokens": 43843406.0, + "step": 18950 + }, + { + "epoch": 0.17383331805262675, + "learning_rate": 0.00016523517007426423, + "loss": 0.8709, + "mean_token_accuracy": 0.7417144775390625, + "num_tokens": 43866202.0, + "step": 18960 + }, + { + "epoch": 0.17392500229210597, + "learning_rate": 0.0001652168332263684, + "loss": 0.8615, + "mean_token_accuracy": 0.7436456739902496, + "num_tokens": 43889572.0, + "step": 18970 + }, + { + "epoch": 0.17401668653158522, + "learning_rate": 0.00016519849637847256, + "loss": 0.8575, + "mean_token_accuracy": 0.742885822057724, + "num_tokens": 43911886.0, + "step": 18980 + }, + { + "epoch": 0.17410837077106445, + "learning_rate": 0.0001651801595305767, + "loss": 0.8632, + "mean_token_accuracy": 0.7443060219287873, + "num_tokens": 43934848.0, + "step": 18990 + }, + { + "epoch": 0.1742000550105437, + "learning_rate": 0.00016516182268268086, + "loss": 0.8399, + "mean_token_accuracy": 0.7461564898490906, + "num_tokens": 43957831.0, + "step": 19000 + }, + { + "epoch": 0.17429173925002292, + "learning_rate": 0.000165143485834785, + "loss": 0.8845, + "mean_token_accuracy": 0.7413355529308319, + "num_tokens": 43981365.0, + "step": 19010 + }, + { + "epoch": 0.17438342348950214, + "learning_rate": 0.00016512514898688917, + "loss": 0.8653, + "mean_token_accuracy": 0.742383724451065, + "num_tokens": 44004122.0, + "step": 19020 + }, + { + "epoch": 0.1744751077289814, + "learning_rate": 0.0001651068121389933, + "loss": 0.833, + "mean_token_accuracy": 0.7481968820095062, + "num_tokens": 44027032.0, + "step": 19030 + }, + { + "epoch": 0.17456679196846062, + "learning_rate": 0.00016508847529109747, + "loss": 0.8588, + "mean_token_accuracy": 0.7434242486953735, + "num_tokens": 44050243.0, + "step": 19040 + }, + { + "epoch": 0.17465847620793987, + "learning_rate": 0.00016507013844320164, + "loss": 0.8354, + "mean_token_accuracy": 0.75514035820961, + "num_tokens": 44073127.0, + "step": 19050 + }, + { + "epoch": 0.1747501604474191, + "learning_rate": 0.00016505180159530577, + "loss": 0.8855, + "mean_token_accuracy": 0.7421274006366729, + "num_tokens": 44095286.0, + "step": 19060 + }, + { + "epoch": 0.1748418446868983, + "learning_rate": 0.00016503346474740994, + "loss": 0.8818, + "mean_token_accuracy": 0.7372287750244141, + "num_tokens": 44118182.0, + "step": 19070 + }, + { + "epoch": 0.17493352892637756, + "learning_rate": 0.00016501512789951408, + "loss": 0.8629, + "mean_token_accuracy": 0.7466937124729156, + "num_tokens": 44141274.0, + "step": 19080 + }, + { + "epoch": 0.17502521316585679, + "learning_rate": 0.00016499679105161822, + "loss": 0.8583, + "mean_token_accuracy": 0.7452625215053559, + "num_tokens": 44164500.0, + "step": 19090 + }, + { + "epoch": 0.17511689740533604, + "learning_rate": 0.0001649784542037224, + "loss": 0.8361, + "mean_token_accuracy": 0.7550947666168213, + "num_tokens": 44187497.0, + "step": 19100 + }, + { + "epoch": 0.17520858164481526, + "learning_rate": 0.00016496011735582655, + "loss": 0.8848, + "mean_token_accuracy": 0.7341136753559112, + "num_tokens": 44210448.0, + "step": 19110 + }, + { + "epoch": 0.17530026588429448, + "learning_rate": 0.0001649417805079307, + "loss": 0.8689, + "mean_token_accuracy": 0.7395574748516083, + "num_tokens": 44234122.0, + "step": 19120 + }, + { + "epoch": 0.17539195012377373, + "learning_rate": 0.00016492344366003485, + "loss": 0.872, + "mean_token_accuracy": 0.7390694618225098, + "num_tokens": 44257673.0, + "step": 19130 + }, + { + "epoch": 0.17548363436325295, + "learning_rate": 0.000164905106812139, + "loss": 0.8429, + "mean_token_accuracy": 0.74883993268013, + "num_tokens": 44281056.0, + "step": 19140 + }, + { + "epoch": 0.17557531860273218, + "learning_rate": 0.00016488676996424315, + "loss": 0.8948, + "mean_token_accuracy": 0.7357378482818604, + "num_tokens": 44303911.0, + "step": 19150 + }, + { + "epoch": 0.17566700284221143, + "learning_rate": 0.0001648684331163473, + "loss": 0.884, + "mean_token_accuracy": 0.7400649547576904, + "num_tokens": 44327654.0, + "step": 19160 + }, + { + "epoch": 0.17575868708169065, + "learning_rate": 0.00016485009626845146, + "loss": 0.901, + "mean_token_accuracy": 0.7337875425815582, + "num_tokens": 44350895.0, + "step": 19170 + }, + { + "epoch": 0.1758503713211699, + "learning_rate": 0.00016483175942055562, + "loss": 0.8898, + "mean_token_accuracy": 0.7370629727840423, + "num_tokens": 44374201.0, + "step": 19180 + }, + { + "epoch": 0.17594205556064912, + "learning_rate": 0.00016481342257265976, + "loss": 0.8717, + "mean_token_accuracy": 0.7427584946155548, + "num_tokens": 44396954.0, + "step": 19190 + }, + { + "epoch": 0.17603373980012835, + "learning_rate": 0.00016479508572476393, + "loss": 0.8361, + "mean_token_accuracy": 0.7497299134731292, + "num_tokens": 44419306.0, + "step": 19200 + }, + { + "epoch": 0.1761254240396076, + "learning_rate": 0.00016477674887686807, + "loss": 0.8891, + "mean_token_accuracy": 0.73868328332901, + "num_tokens": 44442145.0, + "step": 19210 + }, + { + "epoch": 0.17621710827908682, + "learning_rate": 0.00016475841202897223, + "loss": 0.8564, + "mean_token_accuracy": 0.7455623626708985, + "num_tokens": 44465833.0, + "step": 19220 + }, + { + "epoch": 0.17630879251856607, + "learning_rate": 0.00016474007518107637, + "loss": 0.8942, + "mean_token_accuracy": 0.7397753775119782, + "num_tokens": 44488565.0, + "step": 19230 + }, + { + "epoch": 0.1764004767580453, + "learning_rate": 0.00016472173833318053, + "loss": 0.8786, + "mean_token_accuracy": 0.7374221444129944, + "num_tokens": 44512602.0, + "step": 19240 + }, + { + "epoch": 0.17649216099752452, + "learning_rate": 0.0001647034014852847, + "loss": 0.8593, + "mean_token_accuracy": 0.7420086741447449, + "num_tokens": 44535602.0, + "step": 19250 + }, + { + "epoch": 0.17658384523700377, + "learning_rate": 0.00016468506463738884, + "loss": 0.8832, + "mean_token_accuracy": 0.7369343996047973, + "num_tokens": 44558799.0, + "step": 19260 + }, + { + "epoch": 0.176675529476483, + "learning_rate": 0.000164666727789493, + "loss": 0.8477, + "mean_token_accuracy": 0.7505451381206513, + "num_tokens": 44582549.0, + "step": 19270 + }, + { + "epoch": 0.1767672137159622, + "learning_rate": 0.00016464839094159714, + "loss": 0.8617, + "mean_token_accuracy": 0.7434860467910767, + "num_tokens": 44604766.0, + "step": 19280 + }, + { + "epoch": 0.17685889795544146, + "learning_rate": 0.00016463005409370128, + "loss": 0.836, + "mean_token_accuracy": 0.7471416652202606, + "num_tokens": 44627621.0, + "step": 19290 + }, + { + "epoch": 0.17695058219492069, + "learning_rate": 0.00016461171724580547, + "loss": 0.9164, + "mean_token_accuracy": 0.7298359870910645, + "num_tokens": 44650461.0, + "step": 19300 + }, + { + "epoch": 0.17704226643439994, + "learning_rate": 0.0001645933803979096, + "loss": 0.804, + "mean_token_accuracy": 0.7538255751132965, + "num_tokens": 44673964.0, + "step": 19310 + }, + { + "epoch": 0.17713395067387916, + "learning_rate": 0.00016457504355001378, + "loss": 0.862, + "mean_token_accuracy": 0.7465196669101715, + "num_tokens": 44696838.0, + "step": 19320 + }, + { + "epoch": 0.17722563491335838, + "learning_rate": 0.00016455670670211791, + "loss": 0.8774, + "mean_token_accuracy": 0.7344714820384979, + "num_tokens": 44719826.0, + "step": 19330 + }, + { + "epoch": 0.17731731915283763, + "learning_rate": 0.00016453836985422205, + "loss": 0.8914, + "mean_token_accuracy": 0.7317513585090637, + "num_tokens": 44743711.0, + "step": 19340 + }, + { + "epoch": 0.17740900339231686, + "learning_rate": 0.00016452003300632622, + "loss": 0.8777, + "mean_token_accuracy": 0.7445966899394989, + "num_tokens": 44766384.0, + "step": 19350 + }, + { + "epoch": 0.1775006876317961, + "learning_rate": 0.00016450169615843036, + "loss": 0.8465, + "mean_token_accuracy": 0.741133987903595, + "num_tokens": 44790028.0, + "step": 19360 + }, + { + "epoch": 0.17759237187127533, + "learning_rate": 0.00016448335931053452, + "loss": 0.8943, + "mean_token_accuracy": 0.7360158443450928, + "num_tokens": 44812679.0, + "step": 19370 + }, + { + "epoch": 0.17768405611075455, + "learning_rate": 0.0001644650224626387, + "loss": 0.9177, + "mean_token_accuracy": 0.7309502482414245, + "num_tokens": 44835430.0, + "step": 19380 + }, + { + "epoch": 0.1777757403502338, + "learning_rate": 0.00016444668561474283, + "loss": 0.8903, + "mean_token_accuracy": 0.7399446070194244, + "num_tokens": 44858385.0, + "step": 19390 + }, + { + "epoch": 0.17786742458971302, + "learning_rate": 0.000164428348766847, + "loss": 0.8501, + "mean_token_accuracy": 0.7484567940235138, + "num_tokens": 44881181.0, + "step": 19400 + }, + { + "epoch": 0.17795910882919228, + "learning_rate": 0.00016441001191895113, + "loss": 0.8593, + "mean_token_accuracy": 0.7476139545440674, + "num_tokens": 44904429.0, + "step": 19410 + }, + { + "epoch": 0.1780507930686715, + "learning_rate": 0.0001643916750710553, + "loss": 0.8799, + "mean_token_accuracy": 0.7403489708900451, + "num_tokens": 44927631.0, + "step": 19420 + }, + { + "epoch": 0.17814247730815072, + "learning_rate": 0.00016437333822315946, + "loss": 0.8964, + "mean_token_accuracy": 0.732146555185318, + "num_tokens": 44951356.0, + "step": 19430 + }, + { + "epoch": 0.17823416154762997, + "learning_rate": 0.0001643550013752636, + "loss": 0.8373, + "mean_token_accuracy": 0.7548953115940094, + "num_tokens": 44974118.0, + "step": 19440 + }, + { + "epoch": 0.1783258457871092, + "learning_rate": 0.00016433666452736776, + "loss": 0.8719, + "mean_token_accuracy": 0.7457742691040039, + "num_tokens": 44996700.0, + "step": 19450 + }, + { + "epoch": 0.17841753002658842, + "learning_rate": 0.0001643183276794719, + "loss": 0.8561, + "mean_token_accuracy": 0.7452894151210785, + "num_tokens": 45019881.0, + "step": 19460 + }, + { + "epoch": 0.17850921426606767, + "learning_rate": 0.00016429999083157607, + "loss": 0.8159, + "mean_token_accuracy": 0.7612899601459503, + "num_tokens": 45043074.0, + "step": 19470 + }, + { + "epoch": 0.1786008985055469, + "learning_rate": 0.0001642816539836802, + "loss": 0.8534, + "mean_token_accuracy": 0.7475025415420532, + "num_tokens": 45066291.0, + "step": 19480 + }, + { + "epoch": 0.17869258274502614, + "learning_rate": 0.00016426331713578434, + "loss": 0.8666, + "mean_token_accuracy": 0.7391200125217438, + "num_tokens": 45090233.0, + "step": 19490 + }, + { + "epoch": 0.17878426698450536, + "learning_rate": 0.00016424498028788854, + "loss": 0.8746, + "mean_token_accuracy": 0.7415766716003418, + "num_tokens": 45113733.0, + "step": 19500 + }, + { + "epoch": 0.1788759512239846, + "learning_rate": 0.00016422664343999268, + "loss": 0.8629, + "mean_token_accuracy": 0.7435136795043945, + "num_tokens": 45137173.0, + "step": 19510 + }, + { + "epoch": 0.17896763546346384, + "learning_rate": 0.00016420830659209684, + "loss": 0.8473, + "mean_token_accuracy": 0.748375552892685, + "num_tokens": 45159798.0, + "step": 19520 + }, + { + "epoch": 0.17905931970294306, + "learning_rate": 0.00016418996974420098, + "loss": 0.8753, + "mean_token_accuracy": 0.7303220510482789, + "num_tokens": 45183235.0, + "step": 19530 + }, + { + "epoch": 0.1791510039424223, + "learning_rate": 0.00016417163289630512, + "loss": 0.888, + "mean_token_accuracy": 0.7358284950256347, + "num_tokens": 45206108.0, + "step": 19540 + }, + { + "epoch": 0.17924268818190153, + "learning_rate": 0.00016415329604840928, + "loss": 0.8711, + "mean_token_accuracy": 0.7365753650665283, + "num_tokens": 45228871.0, + "step": 19550 + }, + { + "epoch": 0.17933437242138076, + "learning_rate": 0.00016413495920051345, + "loss": 0.8983, + "mean_token_accuracy": 0.7411333501338959, + "num_tokens": 45252530.0, + "step": 19560 + }, + { + "epoch": 0.17942605666086, + "learning_rate": 0.0001641166223526176, + "loss": 0.8737, + "mean_token_accuracy": 0.746991240978241, + "num_tokens": 45276643.0, + "step": 19570 + }, + { + "epoch": 0.17951774090033923, + "learning_rate": 0.00016409828550472175, + "loss": 0.8556, + "mean_token_accuracy": 0.7432246744632721, + "num_tokens": 45299791.0, + "step": 19580 + }, + { + "epoch": 0.17960942513981845, + "learning_rate": 0.0001640799486568259, + "loss": 0.8649, + "mean_token_accuracy": 0.7457501471042634, + "num_tokens": 45323666.0, + "step": 19590 + }, + { + "epoch": 0.1797011093792977, + "learning_rate": 0.00016406161180893006, + "loss": 0.8451, + "mean_token_accuracy": 0.7440292656421661, + "num_tokens": 45347025.0, + "step": 19600 + }, + { + "epoch": 0.17979279361877692, + "learning_rate": 0.0001640432749610342, + "loss": 0.8839, + "mean_token_accuracy": 0.7357450425624847, + "num_tokens": 45369527.0, + "step": 19610 + }, + { + "epoch": 0.17988447785825618, + "learning_rate": 0.00016402493811313836, + "loss": 0.8651, + "mean_token_accuracy": 0.7435458481311799, + "num_tokens": 45392440.0, + "step": 19620 + }, + { + "epoch": 0.1799761620977354, + "learning_rate": 0.00016400660126524253, + "loss": 0.8316, + "mean_token_accuracy": 0.7475884079933166, + "num_tokens": 45416597.0, + "step": 19630 + }, + { + "epoch": 0.18006784633721462, + "learning_rate": 0.00016398826441734666, + "loss": 0.8506, + "mean_token_accuracy": 0.7514847576618194, + "num_tokens": 45439155.0, + "step": 19640 + }, + { + "epoch": 0.18015953057669387, + "learning_rate": 0.00016396992756945083, + "loss": 0.8856, + "mean_token_accuracy": 0.7473500847816468, + "num_tokens": 45461757.0, + "step": 19650 + }, + { + "epoch": 0.1802512148161731, + "learning_rate": 0.00016395159072155497, + "loss": 0.9023, + "mean_token_accuracy": 0.7286785840988159, + "num_tokens": 45484391.0, + "step": 19660 + }, + { + "epoch": 0.18034289905565234, + "learning_rate": 0.00016393325387365913, + "loss": 0.8871, + "mean_token_accuracy": 0.7373834609985351, + "num_tokens": 45507644.0, + "step": 19670 + }, + { + "epoch": 0.18043458329513157, + "learning_rate": 0.00016391491702576327, + "loss": 0.8757, + "mean_token_accuracy": 0.7394998490810394, + "num_tokens": 45530964.0, + "step": 19680 + }, + { + "epoch": 0.1805262675346108, + "learning_rate": 0.00016389658017786744, + "loss": 0.8708, + "mean_token_accuracy": 0.7445003032684326, + "num_tokens": 45554679.0, + "step": 19690 + }, + { + "epoch": 0.18061795177409004, + "learning_rate": 0.0001638782433299716, + "loss": 0.8427, + "mean_token_accuracy": 0.7432986915111541, + "num_tokens": 45577356.0, + "step": 19700 + }, + { + "epoch": 0.18070963601356926, + "learning_rate": 0.00016385990648207574, + "loss": 0.8865, + "mean_token_accuracy": 0.740937077999115, + "num_tokens": 45600553.0, + "step": 19710 + }, + { + "epoch": 0.18080132025304851, + "learning_rate": 0.0001638415696341799, + "loss": 0.8362, + "mean_token_accuracy": 0.7443297207355499, + "num_tokens": 45623672.0, + "step": 19720 + }, + { + "epoch": 0.18089300449252774, + "learning_rate": 0.00016382323278628404, + "loss": 0.8856, + "mean_token_accuracy": 0.7394998967647552, + "num_tokens": 45647220.0, + "step": 19730 + }, + { + "epoch": 0.18098468873200696, + "learning_rate": 0.00016380489593838818, + "loss": 0.8825, + "mean_token_accuracy": 0.7407486975193024, + "num_tokens": 45670407.0, + "step": 19740 + }, + { + "epoch": 0.1810763729714862, + "learning_rate": 0.00016378655909049235, + "loss": 0.8626, + "mean_token_accuracy": 0.7361254632472992, + "num_tokens": 45693934.0, + "step": 19750 + }, + { + "epoch": 0.18116805721096543, + "learning_rate": 0.0001637682222425965, + "loss": 0.8686, + "mean_token_accuracy": 0.7386096835136413, + "num_tokens": 45716903.0, + "step": 19760 + }, + { + "epoch": 0.18125974145044466, + "learning_rate": 0.00016374988539470065, + "loss": 0.8946, + "mean_token_accuracy": 0.7376744985580445, + "num_tokens": 45740340.0, + "step": 19770 + }, + { + "epoch": 0.1813514256899239, + "learning_rate": 0.00016373154854680482, + "loss": 0.8693, + "mean_token_accuracy": 0.7449719130992889, + "num_tokens": 45763197.0, + "step": 19780 + }, + { + "epoch": 0.18144310992940313, + "learning_rate": 0.00016371321169890895, + "loss": 0.8468, + "mean_token_accuracy": 0.7459929168224335, + "num_tokens": 45785869.0, + "step": 19790 + }, + { + "epoch": 0.18153479416888238, + "learning_rate": 0.00016369487485101312, + "loss": 0.8516, + "mean_token_accuracy": 0.7407790124416351, + "num_tokens": 45809432.0, + "step": 19800 + }, + { + "epoch": 0.1816264784083616, + "learning_rate": 0.00016367653800311726, + "loss": 0.8459, + "mean_token_accuracy": 0.744923597574234, + "num_tokens": 45832356.0, + "step": 19810 + }, + { + "epoch": 0.18171816264784083, + "learning_rate": 0.00016365820115522142, + "loss": 0.8828, + "mean_token_accuracy": 0.7451933920383453, + "num_tokens": 45855088.0, + "step": 19820 + }, + { + "epoch": 0.18180984688732008, + "learning_rate": 0.0001636398643073256, + "loss": 0.8364, + "mean_token_accuracy": 0.7445485055446625, + "num_tokens": 45877463.0, + "step": 19830 + }, + { + "epoch": 0.1819015311267993, + "learning_rate": 0.00016362152745942973, + "loss": 0.8548, + "mean_token_accuracy": 0.745529317855835, + "num_tokens": 45900717.0, + "step": 19840 + }, + { + "epoch": 0.18199321536627855, + "learning_rate": 0.0001636031906115339, + "loss": 0.9117, + "mean_token_accuracy": 0.7307271659374237, + "num_tokens": 45924046.0, + "step": 19850 + }, + { + "epoch": 0.18208489960575777, + "learning_rate": 0.00016358485376363803, + "loss": 0.9024, + "mean_token_accuracy": 0.7345387160778045, + "num_tokens": 45946762.0, + "step": 19860 + }, + { + "epoch": 0.182176583845237, + "learning_rate": 0.0001635665169157422, + "loss": 0.8936, + "mean_token_accuracy": 0.736064100265503, + "num_tokens": 45969741.0, + "step": 19870 + }, + { + "epoch": 0.18226826808471625, + "learning_rate": 0.00016354818006784634, + "loss": 0.8923, + "mean_token_accuracy": 0.7301272034645081, + "num_tokens": 45992270.0, + "step": 19880 + }, + { + "epoch": 0.18235995232419547, + "learning_rate": 0.0001635298432199505, + "loss": 0.8584, + "mean_token_accuracy": 0.7410679697990418, + "num_tokens": 46015207.0, + "step": 19890 + }, + { + "epoch": 0.1824516365636747, + "learning_rate": 0.00016351150637205467, + "loss": 0.8307, + "mean_token_accuracy": 0.7555568873882293, + "num_tokens": 46038371.0, + "step": 19900 + }, + { + "epoch": 0.18254332080315394, + "learning_rate": 0.0001634931695241588, + "loss": 0.8631, + "mean_token_accuracy": 0.7425933182239532, + "num_tokens": 46061087.0, + "step": 19910 + }, + { + "epoch": 0.18263500504263316, + "learning_rate": 0.00016347483267626297, + "loss": 0.8616, + "mean_token_accuracy": 0.740113353729248, + "num_tokens": 46084548.0, + "step": 19920 + }, + { + "epoch": 0.18272668928211241, + "learning_rate": 0.0001634564958283671, + "loss": 0.8058, + "mean_token_accuracy": 0.7532809972763062, + "num_tokens": 46107256.0, + "step": 19930 + }, + { + "epoch": 0.18281837352159164, + "learning_rate": 0.00016343815898047125, + "loss": 0.9007, + "mean_token_accuracy": 0.7346232056617736, + "num_tokens": 46130516.0, + "step": 19940 + }, + { + "epoch": 0.18291005776107086, + "learning_rate": 0.00016341982213257544, + "loss": 0.8798, + "mean_token_accuracy": 0.7400797307491302, + "num_tokens": 46154477.0, + "step": 19950 + }, + { + "epoch": 0.1830017420005501, + "learning_rate": 0.00016340148528467958, + "loss": 0.801, + "mean_token_accuracy": 0.7564774513244629, + "num_tokens": 46177456.0, + "step": 19960 + }, + { + "epoch": 0.18309342624002933, + "learning_rate": 0.00016338314843678372, + "loss": 0.8632, + "mean_token_accuracy": 0.7449011743068695, + "num_tokens": 46200615.0, + "step": 19970 + }, + { + "epoch": 0.18318511047950858, + "learning_rate": 0.00016336481158888788, + "loss": 0.8412, + "mean_token_accuracy": 0.7452260315418243, + "num_tokens": 46223213.0, + "step": 19980 + }, + { + "epoch": 0.1832767947189878, + "learning_rate": 0.00016334647474099202, + "loss": 0.8601, + "mean_token_accuracy": 0.746433675289154, + "num_tokens": 46246461.0, + "step": 19990 + }, + { + "epoch": 0.18336847895846703, + "learning_rate": 0.00016332813789309618, + "loss": 0.8602, + "mean_token_accuracy": 0.7386339783668519, + "num_tokens": 46268440.0, + "step": 20000 + }, + { + "epoch": 0.18346016319794628, + "learning_rate": 0.00016330980104520032, + "loss": 0.8636, + "mean_token_accuracy": 0.7404561281204224, + "num_tokens": 46291501.0, + "step": 20010 + }, + { + "epoch": 0.1835518474374255, + "learning_rate": 0.0001632914641973045, + "loss": 0.8874, + "mean_token_accuracy": 0.7369221687316895, + "num_tokens": 46314964.0, + "step": 20020 + }, + { + "epoch": 0.18364353167690475, + "learning_rate": 0.00016327312734940865, + "loss": 0.8651, + "mean_token_accuracy": 0.7409957587718964, + "num_tokens": 46337717.0, + "step": 20030 + }, + { + "epoch": 0.18373521591638398, + "learning_rate": 0.0001632547905015128, + "loss": 0.884, + "mean_token_accuracy": 0.7375479519367218, + "num_tokens": 46360631.0, + "step": 20040 + }, + { + "epoch": 0.1838269001558632, + "learning_rate": 0.00016323645365361696, + "loss": 0.8746, + "mean_token_accuracy": 0.7424764573574066, + "num_tokens": 46384250.0, + "step": 20050 + }, + { + "epoch": 0.18391858439534245, + "learning_rate": 0.0001632181168057211, + "loss": 0.8493, + "mean_token_accuracy": 0.7477382957935333, + "num_tokens": 46407372.0, + "step": 20060 + }, + { + "epoch": 0.18401026863482167, + "learning_rate": 0.00016319977995782526, + "loss": 0.8902, + "mean_token_accuracy": 0.7340875267982483, + "num_tokens": 46430793.0, + "step": 20070 + }, + { + "epoch": 0.1841019528743009, + "learning_rate": 0.00016318144310992943, + "loss": 0.8558, + "mean_token_accuracy": 0.7367632687091827, + "num_tokens": 46452956.0, + "step": 20080 + }, + { + "epoch": 0.18419363711378015, + "learning_rate": 0.00016316310626203357, + "loss": 0.9275, + "mean_token_accuracy": 0.7276939272880554, + "num_tokens": 46476194.0, + "step": 20090 + }, + { + "epoch": 0.18428532135325937, + "learning_rate": 0.00016314476941413773, + "loss": 0.8635, + "mean_token_accuracy": 0.7420652866363525, + "num_tokens": 46500028.0, + "step": 20100 + }, + { + "epoch": 0.18437700559273862, + "learning_rate": 0.00016312643256624187, + "loss": 0.8622, + "mean_token_accuracy": 0.7478643298149109, + "num_tokens": 46522328.0, + "step": 20110 + }, + { + "epoch": 0.18446868983221784, + "learning_rate": 0.00016310809571834603, + "loss": 0.9022, + "mean_token_accuracy": 0.739221578836441, + "num_tokens": 46544781.0, + "step": 20120 + }, + { + "epoch": 0.18456037407169706, + "learning_rate": 0.00016308975887045017, + "loss": 0.8737, + "mean_token_accuracy": 0.7402739584445953, + "num_tokens": 46567167.0, + "step": 20130 + }, + { + "epoch": 0.18465205831117631, + "learning_rate": 0.0001630714220225543, + "loss": 0.8891, + "mean_token_accuracy": 0.7409417510032654, + "num_tokens": 46590490.0, + "step": 20140 + }, + { + "epoch": 0.18474374255065554, + "learning_rate": 0.0001630530851746585, + "loss": 0.8535, + "mean_token_accuracy": 0.7470172762870788, + "num_tokens": 46613515.0, + "step": 20150 + }, + { + "epoch": 0.1848354267901348, + "learning_rate": 0.00016303474832676264, + "loss": 0.8709, + "mean_token_accuracy": 0.7364602446556091, + "num_tokens": 46636624.0, + "step": 20160 + }, + { + "epoch": 0.184927111029614, + "learning_rate": 0.00016301641147886678, + "loss": 0.8492, + "mean_token_accuracy": 0.7441396534442901, + "num_tokens": 46659294.0, + "step": 20170 + }, + { + "epoch": 0.18501879526909323, + "learning_rate": 0.00016299807463097095, + "loss": 0.8375, + "mean_token_accuracy": 0.751100218296051, + "num_tokens": 46682558.0, + "step": 20180 + }, + { + "epoch": 0.18511047950857248, + "learning_rate": 0.00016297973778307508, + "loss": 0.8435, + "mean_token_accuracy": 0.7442737102508545, + "num_tokens": 46706272.0, + "step": 20190 + }, + { + "epoch": 0.1852021637480517, + "learning_rate": 0.00016296140093517925, + "loss": 0.8606, + "mean_token_accuracy": 0.7447192013263703, + "num_tokens": 46729004.0, + "step": 20200 + }, + { + "epoch": 0.18529384798753093, + "learning_rate": 0.00016294306408728341, + "loss": 0.8893, + "mean_token_accuracy": 0.737049913406372, + "num_tokens": 46751920.0, + "step": 20210 + }, + { + "epoch": 0.18538553222701018, + "learning_rate": 0.00016292472723938755, + "loss": 0.8351, + "mean_token_accuracy": 0.7449952661991119, + "num_tokens": 46775591.0, + "step": 20220 + }, + { + "epoch": 0.1854772164664894, + "learning_rate": 0.00016290639039149172, + "loss": 0.8686, + "mean_token_accuracy": 0.7429184257984162, + "num_tokens": 46799177.0, + "step": 20230 + }, + { + "epoch": 0.18556890070596865, + "learning_rate": 0.00016288805354359586, + "loss": 0.8657, + "mean_token_accuracy": 0.7441246688365937, + "num_tokens": 46822170.0, + "step": 20240 + }, + { + "epoch": 0.18566058494544788, + "learning_rate": 0.00016286971669570002, + "loss": 0.8754, + "mean_token_accuracy": 0.741225790977478, + "num_tokens": 46845590.0, + "step": 20250 + }, + { + "epoch": 0.1857522691849271, + "learning_rate": 0.00016285137984780416, + "loss": 0.8961, + "mean_token_accuracy": 0.739786970615387, + "num_tokens": 46868713.0, + "step": 20260 + }, + { + "epoch": 0.18584395342440635, + "learning_rate": 0.00016283304299990833, + "loss": 0.8766, + "mean_token_accuracy": 0.7376769185066223, + "num_tokens": 46891875.0, + "step": 20270 + }, + { + "epoch": 0.18593563766388557, + "learning_rate": 0.0001628147061520125, + "loss": 0.8516, + "mean_token_accuracy": 0.7486691176891327, + "num_tokens": 46915159.0, + "step": 20280 + }, + { + "epoch": 0.18602732190336482, + "learning_rate": 0.00016279636930411663, + "loss": 0.8967, + "mean_token_accuracy": 0.737358820438385, + "num_tokens": 46937783.0, + "step": 20290 + }, + { + "epoch": 0.18611900614284405, + "learning_rate": 0.0001627780324562208, + "loss": 0.8698, + "mean_token_accuracy": 0.7393028676509857, + "num_tokens": 46960877.0, + "step": 20300 + }, + { + "epoch": 0.18621069038232327, + "learning_rate": 0.00016275969560832493, + "loss": 0.8501, + "mean_token_accuracy": 0.7443229734897614, + "num_tokens": 46984237.0, + "step": 20310 + }, + { + "epoch": 0.18630237462180252, + "learning_rate": 0.0001627413587604291, + "loss": 0.8692, + "mean_token_accuracy": 0.7384073853492736, + "num_tokens": 47007071.0, + "step": 20320 + }, + { + "epoch": 0.18639405886128174, + "learning_rate": 0.00016272302191253324, + "loss": 0.8642, + "mean_token_accuracy": 0.7440657258033753, + "num_tokens": 47030529.0, + "step": 20330 + }, + { + "epoch": 0.186485743100761, + "learning_rate": 0.0001627046850646374, + "loss": 0.8998, + "mean_token_accuracy": 0.7337565958499909, + "num_tokens": 47054139.0, + "step": 20340 + }, + { + "epoch": 0.18657742734024022, + "learning_rate": 0.00016268634821674157, + "loss": 0.9173, + "mean_token_accuracy": 0.7255724966526031, + "num_tokens": 47077431.0, + "step": 20350 + }, + { + "epoch": 0.18666911157971944, + "learning_rate": 0.0001626680113688457, + "loss": 0.8224, + "mean_token_accuracy": 0.7518046200275421, + "num_tokens": 47100193.0, + "step": 20360 + }, + { + "epoch": 0.1867607958191987, + "learning_rate": 0.00016264967452094984, + "loss": 0.8833, + "mean_token_accuracy": 0.7428637504577636, + "num_tokens": 47123625.0, + "step": 20370 + }, + { + "epoch": 0.1868524800586779, + "learning_rate": 0.000162631337673054, + "loss": 0.8519, + "mean_token_accuracy": 0.742831003665924, + "num_tokens": 47146914.0, + "step": 20380 + }, + { + "epoch": 0.18694416429815713, + "learning_rate": 0.00016261300082515815, + "loss": 0.8822, + "mean_token_accuracy": 0.7372194111347199, + "num_tokens": 47170484.0, + "step": 20390 + }, + { + "epoch": 0.18703584853763638, + "learning_rate": 0.00016259466397726231, + "loss": 0.8827, + "mean_token_accuracy": 0.7353140771389007, + "num_tokens": 47193430.0, + "step": 20400 + }, + { + "epoch": 0.1871275327771156, + "learning_rate": 0.00016257632712936648, + "loss": 0.8743, + "mean_token_accuracy": 0.7365429759025574, + "num_tokens": 47216740.0, + "step": 20410 + }, + { + "epoch": 0.18721921701659486, + "learning_rate": 0.00016255799028147062, + "loss": 0.8508, + "mean_token_accuracy": 0.7402590930461883, + "num_tokens": 47239893.0, + "step": 20420 + }, + { + "epoch": 0.18731090125607408, + "learning_rate": 0.00016253965343357478, + "loss": 0.8506, + "mean_token_accuracy": 0.7422642886638642, + "num_tokens": 47262839.0, + "step": 20430 + }, + { + "epoch": 0.1874025854955533, + "learning_rate": 0.00016252131658567892, + "loss": 0.9027, + "mean_token_accuracy": 0.7306043088436127, + "num_tokens": 47285612.0, + "step": 20440 + }, + { + "epoch": 0.18749426973503255, + "learning_rate": 0.0001625029797377831, + "loss": 0.8818, + "mean_token_accuracy": 0.7351073741912841, + "num_tokens": 47308929.0, + "step": 20450 + }, + { + "epoch": 0.18758595397451178, + "learning_rate": 0.00016248464288988722, + "loss": 0.8744, + "mean_token_accuracy": 0.7398530781269074, + "num_tokens": 47332396.0, + "step": 20460 + }, + { + "epoch": 0.18767763821399103, + "learning_rate": 0.0001624663060419914, + "loss": 0.8563, + "mean_token_accuracy": 0.7346394240856171, + "num_tokens": 47356014.0, + "step": 20470 + }, + { + "epoch": 0.18776932245347025, + "learning_rate": 0.00016244796919409556, + "loss": 0.8702, + "mean_token_accuracy": 0.7430578410625458, + "num_tokens": 47378518.0, + "step": 20480 + }, + { + "epoch": 0.18786100669294947, + "learning_rate": 0.0001624296323461997, + "loss": 0.8456, + "mean_token_accuracy": 0.7519625306129456, + "num_tokens": 47401956.0, + "step": 20490 + }, + { + "epoch": 0.18795269093242872, + "learning_rate": 0.00016241129549830386, + "loss": 0.8634, + "mean_token_accuracy": 0.7472677826881409, + "num_tokens": 47424377.0, + "step": 20500 + }, + { + "epoch": 0.18804437517190795, + "learning_rate": 0.000162392958650408, + "loss": 0.8654, + "mean_token_accuracy": 0.7401869833469391, + "num_tokens": 47446951.0, + "step": 20510 + }, + { + "epoch": 0.18813605941138717, + "learning_rate": 0.00016237462180251216, + "loss": 0.8847, + "mean_token_accuracy": 0.739195829629898, + "num_tokens": 47469323.0, + "step": 20520 + }, + { + "epoch": 0.18822774365086642, + "learning_rate": 0.0001623562849546163, + "loss": 0.8405, + "mean_token_accuracy": 0.7473972558975219, + "num_tokens": 47492517.0, + "step": 20530 + }, + { + "epoch": 0.18831942789034564, + "learning_rate": 0.00016233794810672047, + "loss": 0.8452, + "mean_token_accuracy": 0.7496969938278198, + "num_tokens": 47515625.0, + "step": 20540 + }, + { + "epoch": 0.1884111121298249, + "learning_rate": 0.00016231961125882463, + "loss": 0.874, + "mean_token_accuracy": 0.7391631364822387, + "num_tokens": 47538126.0, + "step": 20550 + }, + { + "epoch": 0.18850279636930412, + "learning_rate": 0.00016230127441092877, + "loss": 0.8279, + "mean_token_accuracy": 0.7459759950637818, + "num_tokens": 47560266.0, + "step": 20560 + }, + { + "epoch": 0.18859448060878334, + "learning_rate": 0.0001622829375630329, + "loss": 0.8903, + "mean_token_accuracy": 0.7351974725723267, + "num_tokens": 47583398.0, + "step": 20570 + }, + { + "epoch": 0.1886861648482626, + "learning_rate": 0.00016226460071513707, + "loss": 0.8355, + "mean_token_accuracy": 0.7493352830410004, + "num_tokens": 47606618.0, + "step": 20580 + }, + { + "epoch": 0.1887778490877418, + "learning_rate": 0.0001622462638672412, + "loss": 0.8783, + "mean_token_accuracy": 0.7386853516101837, + "num_tokens": 47629504.0, + "step": 20590 + }, + { + "epoch": 0.18886953332722106, + "learning_rate": 0.00016222792701934538, + "loss": 0.8638, + "mean_token_accuracy": 0.7422787070274353, + "num_tokens": 47652234.0, + "step": 20600 + }, + { + "epoch": 0.18896121756670028, + "learning_rate": 0.00016220959017144954, + "loss": 0.9119, + "mean_token_accuracy": 0.7353614032268524, + "num_tokens": 47675685.0, + "step": 20610 + }, + { + "epoch": 0.1890529018061795, + "learning_rate": 0.00016219125332355368, + "loss": 0.8815, + "mean_token_accuracy": 0.7416007101535798, + "num_tokens": 47698240.0, + "step": 20620 + }, + { + "epoch": 0.18914458604565876, + "learning_rate": 0.00016217291647565785, + "loss": 0.8834, + "mean_token_accuracy": 0.7420873403549194, + "num_tokens": 47722415.0, + "step": 20630 + }, + { + "epoch": 0.18923627028513798, + "learning_rate": 0.00016215457962776199, + "loss": 0.8507, + "mean_token_accuracy": 0.7479335606098175, + "num_tokens": 47745210.0, + "step": 20640 + }, + { + "epoch": 0.18932795452461723, + "learning_rate": 0.00016213624277986615, + "loss": 0.8028, + "mean_token_accuracy": 0.7593098104000091, + "num_tokens": 47768717.0, + "step": 20650 + }, + { + "epoch": 0.18941963876409645, + "learning_rate": 0.0001621179059319703, + "loss": 0.8568, + "mean_token_accuracy": 0.7413754463195801, + "num_tokens": 47791806.0, + "step": 20660 + }, + { + "epoch": 0.18951132300357568, + "learning_rate": 0.00016209956908407445, + "loss": 0.8905, + "mean_token_accuracy": 0.7388002455234528, + "num_tokens": 47814623.0, + "step": 20670 + }, + { + "epoch": 0.18960300724305493, + "learning_rate": 0.00016208123223617862, + "loss": 0.897, + "mean_token_accuracy": 0.7394916534423828, + "num_tokens": 47837359.0, + "step": 20680 + }, + { + "epoch": 0.18969469148253415, + "learning_rate": 0.00016206289538828276, + "loss": 0.8884, + "mean_token_accuracy": 0.7370145142078399, + "num_tokens": 47860716.0, + "step": 20690 + }, + { + "epoch": 0.18978637572201337, + "learning_rate": 0.00016204455854038692, + "loss": 0.8339, + "mean_token_accuracy": 0.7474730551242829, + "num_tokens": 47883540.0, + "step": 20700 + }, + { + "epoch": 0.18987805996149262, + "learning_rate": 0.00016202622169249106, + "loss": 0.8427, + "mean_token_accuracy": 0.7456452190876007, + "num_tokens": 47905850.0, + "step": 20710 + }, + { + "epoch": 0.18996974420097185, + "learning_rate": 0.00016200788484459523, + "loss": 0.8965, + "mean_token_accuracy": 0.7329223453998566, + "num_tokens": 47928676.0, + "step": 20720 + }, + { + "epoch": 0.1900614284404511, + "learning_rate": 0.00016198954799669937, + "loss": 0.8594, + "mean_token_accuracy": 0.7428911566734314, + "num_tokens": 47951913.0, + "step": 20730 + }, + { + "epoch": 0.19015311267993032, + "learning_rate": 0.00016197121114880353, + "loss": 0.9172, + "mean_token_accuracy": 0.7258612811565399, + "num_tokens": 47974742.0, + "step": 20740 + }, + { + "epoch": 0.19024479691940954, + "learning_rate": 0.0001619528743009077, + "loss": 0.8565, + "mean_token_accuracy": 0.7507954895496368, + "num_tokens": 47997674.0, + "step": 20750 + }, + { + "epoch": 0.1903364811588888, + "learning_rate": 0.00016193453745301184, + "loss": 0.8899, + "mean_token_accuracy": 0.741180008649826, + "num_tokens": 48019409.0, + "step": 20760 + }, + { + "epoch": 0.19042816539836802, + "learning_rate": 0.00016191620060511597, + "loss": 0.8598, + "mean_token_accuracy": 0.7505606949329376, + "num_tokens": 48042169.0, + "step": 20770 + }, + { + "epoch": 0.19051984963784727, + "learning_rate": 0.00016189786375722014, + "loss": 0.8657, + "mean_token_accuracy": 0.7380756914615632, + "num_tokens": 48065218.0, + "step": 20780 + }, + { + "epoch": 0.1906115338773265, + "learning_rate": 0.00016187952690932428, + "loss": 0.861, + "mean_token_accuracy": 0.7432824075222015, + "num_tokens": 48087671.0, + "step": 20790 + }, + { + "epoch": 0.1907032181168057, + "learning_rate": 0.00016186119006142847, + "loss": 0.8334, + "mean_token_accuracy": 0.7480520606040955, + "num_tokens": 48110601.0, + "step": 20800 + }, + { + "epoch": 0.19079490235628496, + "learning_rate": 0.0001618428532135326, + "loss": 0.8634, + "mean_token_accuracy": 0.7470580756664276, + "num_tokens": 48134187.0, + "step": 20810 + }, + { + "epoch": 0.19088658659576418, + "learning_rate": 0.00016182451636563675, + "loss": 0.8579, + "mean_token_accuracy": 0.7445999026298523, + "num_tokens": 48156688.0, + "step": 20820 + }, + { + "epoch": 0.19097827083524344, + "learning_rate": 0.0001618061795177409, + "loss": 0.864, + "mean_token_accuracy": 0.7393371820449829, + "num_tokens": 48179961.0, + "step": 20830 + }, + { + "epoch": 0.19106995507472266, + "learning_rate": 0.00016178784266984505, + "loss": 0.8817, + "mean_token_accuracy": 0.7396546721458435, + "num_tokens": 48203535.0, + "step": 20840 + }, + { + "epoch": 0.19116163931420188, + "learning_rate": 0.00016176950582194922, + "loss": 0.8593, + "mean_token_accuracy": 0.7402848124504089, + "num_tokens": 48227238.0, + "step": 20850 + }, + { + "epoch": 0.19125332355368113, + "learning_rate": 0.00016175116897405335, + "loss": 0.8888, + "mean_token_accuracy": 0.7421349585056305, + "num_tokens": 48250790.0, + "step": 20860 + }, + { + "epoch": 0.19134500779316035, + "learning_rate": 0.00016173283212615752, + "loss": 0.8508, + "mean_token_accuracy": 0.740914386510849, + "num_tokens": 48273532.0, + "step": 20870 + }, + { + "epoch": 0.19143669203263958, + "learning_rate": 0.00016171449527826168, + "loss": 0.8841, + "mean_token_accuracy": 0.7401702165603637, + "num_tokens": 48296239.0, + "step": 20880 + }, + { + "epoch": 0.19152837627211883, + "learning_rate": 0.00016169615843036582, + "loss": 0.8734, + "mean_token_accuracy": 0.7406877756118775, + "num_tokens": 48319770.0, + "step": 20890 + }, + { + "epoch": 0.19162006051159805, + "learning_rate": 0.00016167782158247, + "loss": 0.8508, + "mean_token_accuracy": 0.7431667506694793, + "num_tokens": 48342994.0, + "step": 20900 + }, + { + "epoch": 0.1917117447510773, + "learning_rate": 0.00016165948473457413, + "loss": 0.8728, + "mean_token_accuracy": 0.743863171339035, + "num_tokens": 48366530.0, + "step": 20910 + }, + { + "epoch": 0.19180342899055652, + "learning_rate": 0.0001616411478866783, + "loss": 0.8555, + "mean_token_accuracy": 0.7453465580940246, + "num_tokens": 48390329.0, + "step": 20920 + }, + { + "epoch": 0.19189511323003575, + "learning_rate": 0.00016162281103878246, + "loss": 0.8696, + "mean_token_accuracy": 0.7463473320007324, + "num_tokens": 48414045.0, + "step": 20930 + }, + { + "epoch": 0.191986797469515, + "learning_rate": 0.0001616044741908866, + "loss": 0.8403, + "mean_token_accuracy": 0.7469229459762573, + "num_tokens": 48437275.0, + "step": 20940 + }, + { + "epoch": 0.19207848170899422, + "learning_rate": 0.00016158613734299076, + "loss": 0.8809, + "mean_token_accuracy": 0.739329582452774, + "num_tokens": 48460011.0, + "step": 20950 + }, + { + "epoch": 0.19217016594847347, + "learning_rate": 0.0001615678004950949, + "loss": 0.8458, + "mean_token_accuracy": 0.7448213636875153, + "num_tokens": 48482742.0, + "step": 20960 + }, + { + "epoch": 0.1922618501879527, + "learning_rate": 0.00016154946364719904, + "loss": 0.8266, + "mean_token_accuracy": 0.7491724967956543, + "num_tokens": 48506138.0, + "step": 20970 + }, + { + "epoch": 0.19235353442743192, + "learning_rate": 0.0001615311267993032, + "loss": 0.8624, + "mean_token_accuracy": 0.7481300830841064, + "num_tokens": 48529314.0, + "step": 20980 + }, + { + "epoch": 0.19244521866691117, + "learning_rate": 0.00016151278995140734, + "loss": 0.8375, + "mean_token_accuracy": 0.7472502052783966, + "num_tokens": 48552194.0, + "step": 20990 + }, + { + "epoch": 0.1925369029063904, + "learning_rate": 0.00016149445310351153, + "loss": 0.8443, + "mean_token_accuracy": 0.7430356681346894, + "num_tokens": 48575035.0, + "step": 21000 + }, + { + "epoch": 0.1926285871458696, + "learning_rate": 0.00016147611625561567, + "loss": 0.857, + "mean_token_accuracy": 0.7412232458591461, + "num_tokens": 48597752.0, + "step": 21010 + }, + { + "epoch": 0.19272027138534886, + "learning_rate": 0.0001614577794077198, + "loss": 0.8431, + "mean_token_accuracy": 0.7491430640220642, + "num_tokens": 48620978.0, + "step": 21020 + }, + { + "epoch": 0.19281195562482809, + "learning_rate": 0.00016143944255982398, + "loss": 0.8545, + "mean_token_accuracy": 0.7437418103218079, + "num_tokens": 48643813.0, + "step": 21030 + }, + { + "epoch": 0.19290363986430734, + "learning_rate": 0.00016142110571192811, + "loss": 0.8528, + "mean_token_accuracy": 0.7407807052135468, + "num_tokens": 48666585.0, + "step": 21040 + }, + { + "epoch": 0.19299532410378656, + "learning_rate": 0.00016140276886403228, + "loss": 0.8069, + "mean_token_accuracy": 0.753812450170517, + "num_tokens": 48689187.0, + "step": 21050 + }, + { + "epoch": 0.19308700834326578, + "learning_rate": 0.00016138443201613645, + "loss": 0.8609, + "mean_token_accuracy": 0.7366057932376862, + "num_tokens": 48712961.0, + "step": 21060 + }, + { + "epoch": 0.19317869258274503, + "learning_rate": 0.00016136609516824058, + "loss": 0.8319, + "mean_token_accuracy": 0.7512231767177582, + "num_tokens": 48735786.0, + "step": 21070 + }, + { + "epoch": 0.19327037682222425, + "learning_rate": 0.00016134775832034475, + "loss": 0.8723, + "mean_token_accuracy": 0.7407830059528351, + "num_tokens": 48759045.0, + "step": 21080 + }, + { + "epoch": 0.1933620610617035, + "learning_rate": 0.0001613294214724489, + "loss": 0.8911, + "mean_token_accuracy": 0.7348986148834229, + "num_tokens": 48781924.0, + "step": 21090 + }, + { + "epoch": 0.19345374530118273, + "learning_rate": 0.00016131108462455305, + "loss": 0.8808, + "mean_token_accuracy": 0.7405512809753418, + "num_tokens": 48805482.0, + "step": 21100 + }, + { + "epoch": 0.19354542954066195, + "learning_rate": 0.0001612927477766572, + "loss": 0.891, + "mean_token_accuracy": 0.7435926377773285, + "num_tokens": 48828544.0, + "step": 21110 + }, + { + "epoch": 0.1936371137801412, + "learning_rate": 0.00016127441092876136, + "loss": 0.8516, + "mean_token_accuracy": 0.7438839197158813, + "num_tokens": 48851860.0, + "step": 21120 + }, + { + "epoch": 0.19372879801962042, + "learning_rate": 0.00016125607408086552, + "loss": 0.8439, + "mean_token_accuracy": 0.7518651962280274, + "num_tokens": 48875109.0, + "step": 21130 + }, + { + "epoch": 0.19382048225909967, + "learning_rate": 0.00016123773723296966, + "loss": 0.8441, + "mean_token_accuracy": 0.740175086259842, + "num_tokens": 48897684.0, + "step": 21140 + }, + { + "epoch": 0.1939121664985789, + "learning_rate": 0.00016121940038507383, + "loss": 0.8888, + "mean_token_accuracy": 0.7309944331645966, + "num_tokens": 48920214.0, + "step": 21150 + }, + { + "epoch": 0.19400385073805812, + "learning_rate": 0.00016120106353717796, + "loss": 0.8848, + "mean_token_accuracy": 0.7339881181716919, + "num_tokens": 48943709.0, + "step": 21160 + }, + { + "epoch": 0.19409553497753737, + "learning_rate": 0.0001611827266892821, + "loss": 0.8611, + "mean_token_accuracy": 0.7382303059101105, + "num_tokens": 48966728.0, + "step": 21170 + }, + { + "epoch": 0.1941872192170166, + "learning_rate": 0.00016116438984138627, + "loss": 0.8668, + "mean_token_accuracy": 0.7442708969116211, + "num_tokens": 48990006.0, + "step": 21180 + }, + { + "epoch": 0.19427890345649582, + "learning_rate": 0.00016114605299349043, + "loss": 0.8585, + "mean_token_accuracy": 0.7375147223472596, + "num_tokens": 49013324.0, + "step": 21190 + }, + { + "epoch": 0.19437058769597507, + "learning_rate": 0.0001611277161455946, + "loss": 0.8542, + "mean_token_accuracy": 0.7424695074558259, + "num_tokens": 49036876.0, + "step": 21200 + }, + { + "epoch": 0.1944622719354543, + "learning_rate": 0.00016110937929769874, + "loss": 0.876, + "mean_token_accuracy": 0.733031016588211, + "num_tokens": 49059836.0, + "step": 21210 + }, + { + "epoch": 0.19455395617493354, + "learning_rate": 0.00016109104244980288, + "loss": 0.8763, + "mean_token_accuracy": 0.7428466975688934, + "num_tokens": 49083313.0, + "step": 21220 + }, + { + "epoch": 0.19464564041441276, + "learning_rate": 0.00016107270560190704, + "loss": 0.8664, + "mean_token_accuracy": 0.7427617132663726, + "num_tokens": 49106201.0, + "step": 21230 + }, + { + "epoch": 0.19473732465389199, + "learning_rate": 0.00016105436875401118, + "loss": 0.839, + "mean_token_accuracy": 0.7424100399017334, + "num_tokens": 49129637.0, + "step": 21240 + }, + { + "epoch": 0.19482900889337124, + "learning_rate": 0.00016103603190611534, + "loss": 0.843, + "mean_token_accuracy": 0.7467679858207703, + "num_tokens": 49152603.0, + "step": 21250 + }, + { + "epoch": 0.19492069313285046, + "learning_rate": 0.0001610176950582195, + "loss": 0.8612, + "mean_token_accuracy": 0.7400746285915375, + "num_tokens": 49176624.0, + "step": 21260 + }, + { + "epoch": 0.1950123773723297, + "learning_rate": 0.00016099935821032365, + "loss": 0.8615, + "mean_token_accuracy": 0.7443634688854217, + "num_tokens": 49200284.0, + "step": 21270 + }, + { + "epoch": 0.19510406161180893, + "learning_rate": 0.00016098102136242781, + "loss": 0.8775, + "mean_token_accuracy": 0.7443433940410614, + "num_tokens": 49223346.0, + "step": 21280 + }, + { + "epoch": 0.19519574585128815, + "learning_rate": 0.00016096268451453195, + "loss": 0.8679, + "mean_token_accuracy": 0.7394611775875092, + "num_tokens": 49246308.0, + "step": 21290 + }, + { + "epoch": 0.1952874300907674, + "learning_rate": 0.00016094434766663612, + "loss": 0.8845, + "mean_token_accuracy": 0.7369400084018707, + "num_tokens": 49269531.0, + "step": 21300 + }, + { + "epoch": 0.19537911433024663, + "learning_rate": 0.00016092601081874026, + "loss": 0.8431, + "mean_token_accuracy": 0.7498523473739624, + "num_tokens": 49292741.0, + "step": 21310 + }, + { + "epoch": 0.19547079856972585, + "learning_rate": 0.00016090767397084442, + "loss": 0.923, + "mean_token_accuracy": 0.7297579348087311, + "num_tokens": 49315473.0, + "step": 21320 + }, + { + "epoch": 0.1955624828092051, + "learning_rate": 0.0001608893371229486, + "loss": 0.8284, + "mean_token_accuracy": 0.7490214943885803, + "num_tokens": 49338023.0, + "step": 21330 + }, + { + "epoch": 0.19565416704868432, + "learning_rate": 0.00016087100027505272, + "loss": 0.8693, + "mean_token_accuracy": 0.740743488073349, + "num_tokens": 49360660.0, + "step": 21340 + }, + { + "epoch": 0.19574585128816357, + "learning_rate": 0.0001608526634271569, + "loss": 0.8527, + "mean_token_accuracy": 0.7407018840312958, + "num_tokens": 49384019.0, + "step": 21350 + }, + { + "epoch": 0.1958375355276428, + "learning_rate": 0.00016083432657926103, + "loss": 0.8638, + "mean_token_accuracy": 0.7416827857494355, + "num_tokens": 49407251.0, + "step": 21360 + }, + { + "epoch": 0.19592921976712202, + "learning_rate": 0.00016081598973136517, + "loss": 0.8749, + "mean_token_accuracy": 0.7415823817253113, + "num_tokens": 49431233.0, + "step": 21370 + }, + { + "epoch": 0.19602090400660127, + "learning_rate": 0.00016079765288346933, + "loss": 0.8675, + "mean_token_accuracy": 0.7362518429756164, + "num_tokens": 49453887.0, + "step": 21380 + }, + { + "epoch": 0.1961125882460805, + "learning_rate": 0.0001607793160355735, + "loss": 0.8628, + "mean_token_accuracy": 0.7395012438297272, + "num_tokens": 49476830.0, + "step": 21390 + }, + { + "epoch": 0.19620427248555974, + "learning_rate": 0.00016076097918767766, + "loss": 0.887, + "mean_token_accuracy": 0.7354326903820038, + "num_tokens": 49500141.0, + "step": 21400 + }, + { + "epoch": 0.19629595672503897, + "learning_rate": 0.0001607426423397818, + "loss": 0.8573, + "mean_token_accuracy": 0.7437665939331055, + "num_tokens": 49524576.0, + "step": 21410 + }, + { + "epoch": 0.1963876409645182, + "learning_rate": 0.00016072430549188594, + "loss": 0.8615, + "mean_token_accuracy": 0.7397708415985107, + "num_tokens": 49547077.0, + "step": 21420 + }, + { + "epoch": 0.19647932520399744, + "learning_rate": 0.0001607059686439901, + "loss": 0.8711, + "mean_token_accuracy": 0.7386774241924285, + "num_tokens": 49569078.0, + "step": 21430 + }, + { + "epoch": 0.19657100944347666, + "learning_rate": 0.00016068763179609424, + "loss": 0.8996, + "mean_token_accuracy": 0.7338386654853821, + "num_tokens": 49591194.0, + "step": 21440 + }, + { + "epoch": 0.1966626936829559, + "learning_rate": 0.00016066929494819844, + "loss": 0.887, + "mean_token_accuracy": 0.7388228833675384, + "num_tokens": 49614734.0, + "step": 21450 + }, + { + "epoch": 0.19675437792243514, + "learning_rate": 0.00016065095810030257, + "loss": 0.8207, + "mean_token_accuracy": 0.7569953620433807, + "num_tokens": 49637603.0, + "step": 21460 + }, + { + "epoch": 0.19684606216191436, + "learning_rate": 0.0001606326212524067, + "loss": 0.8467, + "mean_token_accuracy": 0.7382251560688019, + "num_tokens": 49660518.0, + "step": 21470 + }, + { + "epoch": 0.1969377464013936, + "learning_rate": 0.00016061428440451088, + "loss": 0.917, + "mean_token_accuracy": 0.7341851830482483, + "num_tokens": 49683704.0, + "step": 21480 + }, + { + "epoch": 0.19702943064087283, + "learning_rate": 0.00016059594755661502, + "loss": 0.8925, + "mean_token_accuracy": 0.7335306823253631, + "num_tokens": 49707128.0, + "step": 21490 + }, + { + "epoch": 0.19712111488035206, + "learning_rate": 0.00016057761070871918, + "loss": 0.8705, + "mean_token_accuracy": 0.7388100624084473, + "num_tokens": 49730635.0, + "step": 21500 + }, + { + "epoch": 0.1972127991198313, + "learning_rate": 0.00016055927386082332, + "loss": 0.8486, + "mean_token_accuracy": 0.7437248170375824, + "num_tokens": 49753763.0, + "step": 21510 + }, + { + "epoch": 0.19730448335931053, + "learning_rate": 0.00016054093701292749, + "loss": 0.8649, + "mean_token_accuracy": 0.7463112950325013, + "num_tokens": 49777325.0, + "step": 21520 + }, + { + "epoch": 0.19739616759878978, + "learning_rate": 0.00016052260016503165, + "loss": 0.8478, + "mean_token_accuracy": 0.7517745077610016, + "num_tokens": 49799946.0, + "step": 21530 + }, + { + "epoch": 0.197487851838269, + "learning_rate": 0.0001605042633171358, + "loss": 0.8317, + "mean_token_accuracy": 0.7430775046348572, + "num_tokens": 49823209.0, + "step": 21540 + }, + { + "epoch": 0.19757953607774822, + "learning_rate": 0.00016048592646923995, + "loss": 0.8909, + "mean_token_accuracy": 0.7399197399616242, + "num_tokens": 49846491.0, + "step": 21550 + }, + { + "epoch": 0.19767122031722748, + "learning_rate": 0.0001604675896213441, + "loss": 0.8296, + "mean_token_accuracy": 0.7475386679172515, + "num_tokens": 49869883.0, + "step": 21560 + }, + { + "epoch": 0.1977629045567067, + "learning_rate": 0.00016044925277344823, + "loss": 0.8906, + "mean_token_accuracy": 0.7356217682361603, + "num_tokens": 49893339.0, + "step": 21570 + }, + { + "epoch": 0.19785458879618595, + "learning_rate": 0.0001604309159255524, + "loss": 0.8393, + "mean_token_accuracy": 0.7522357940673828, + "num_tokens": 49915948.0, + "step": 21580 + }, + { + "epoch": 0.19794627303566517, + "learning_rate": 0.00016041257907765656, + "loss": 0.8696, + "mean_token_accuracy": 0.7433183133602143, + "num_tokens": 49939441.0, + "step": 21590 + }, + { + "epoch": 0.1980379572751444, + "learning_rate": 0.00016039424222976073, + "loss": 0.875, + "mean_token_accuracy": 0.7392898082733155, + "num_tokens": 49963324.0, + "step": 21600 + }, + { + "epoch": 0.19812964151462364, + "learning_rate": 0.00016037590538186487, + "loss": 0.8745, + "mean_token_accuracy": 0.7357822299003601, + "num_tokens": 49986258.0, + "step": 21610 + }, + { + "epoch": 0.19822132575410287, + "learning_rate": 0.000160357568533969, + "loss": 0.8493, + "mean_token_accuracy": 0.743507343530655, + "num_tokens": 50009885.0, + "step": 21620 + }, + { + "epoch": 0.1983130099935821, + "learning_rate": 0.00016033923168607317, + "loss": 0.871, + "mean_token_accuracy": 0.7407045245170594, + "num_tokens": 50033198.0, + "step": 21630 + }, + { + "epoch": 0.19840469423306134, + "learning_rate": 0.0001603208948381773, + "loss": 0.8676, + "mean_token_accuracy": 0.7428215622901917, + "num_tokens": 50055204.0, + "step": 21640 + }, + { + "epoch": 0.19849637847254056, + "learning_rate": 0.0001603025579902815, + "loss": 0.8806, + "mean_token_accuracy": 0.7379589200019836, + "num_tokens": 50078253.0, + "step": 21650 + }, + { + "epoch": 0.1985880627120198, + "learning_rate": 0.00016028422114238564, + "loss": 0.849, + "mean_token_accuracy": 0.7472977638244629, + "num_tokens": 50101847.0, + "step": 21660 + }, + { + "epoch": 0.19867974695149904, + "learning_rate": 0.00016026588429448978, + "loss": 0.9058, + "mean_token_accuracy": 0.7337198078632354, + "num_tokens": 50125764.0, + "step": 21670 + }, + { + "epoch": 0.19877143119097826, + "learning_rate": 0.00016024754744659394, + "loss": 0.8531, + "mean_token_accuracy": 0.747775810956955, + "num_tokens": 50148979.0, + "step": 21680 + }, + { + "epoch": 0.1988631154304575, + "learning_rate": 0.00016022921059869808, + "loss": 0.8592, + "mean_token_accuracy": 0.7430618703365326, + "num_tokens": 50171941.0, + "step": 21690 + }, + { + "epoch": 0.19895479966993673, + "learning_rate": 0.00016021087375080225, + "loss": 0.8623, + "mean_token_accuracy": 0.7450705766677856, + "num_tokens": 50195318.0, + "step": 21700 + }, + { + "epoch": 0.19904648390941598, + "learning_rate": 0.00016019253690290638, + "loss": 0.8357, + "mean_token_accuracy": 0.7473804354667664, + "num_tokens": 50219248.0, + "step": 21710 + }, + { + "epoch": 0.1991381681488952, + "learning_rate": 0.00016017420005501055, + "loss": 0.8357, + "mean_token_accuracy": 0.7460615515708924, + "num_tokens": 50241914.0, + "step": 21720 + }, + { + "epoch": 0.19922985238837443, + "learning_rate": 0.00016015586320711472, + "loss": 0.863, + "mean_token_accuracy": 0.7443862438201905, + "num_tokens": 50264705.0, + "step": 21730 + }, + { + "epoch": 0.19932153662785368, + "learning_rate": 0.00016013752635921885, + "loss": 0.808, + "mean_token_accuracy": 0.7541323065757751, + "num_tokens": 50288411.0, + "step": 21740 + }, + { + "epoch": 0.1994132208673329, + "learning_rate": 0.00016011918951132302, + "loss": 0.8671, + "mean_token_accuracy": 0.7393250286579132, + "num_tokens": 50310524.0, + "step": 21750 + }, + { + "epoch": 0.19950490510681215, + "learning_rate": 0.00016010085266342716, + "loss": 0.8577, + "mean_token_accuracy": 0.7456794321537018, + "num_tokens": 50332865.0, + "step": 21760 + }, + { + "epoch": 0.19959658934629138, + "learning_rate": 0.0001600825158155313, + "loss": 0.8613, + "mean_token_accuracy": 0.7444769442081451, + "num_tokens": 50356165.0, + "step": 21770 + }, + { + "epoch": 0.1996882735857706, + "learning_rate": 0.0001600641789676355, + "loss": 0.8371, + "mean_token_accuracy": 0.7507792174816131, + "num_tokens": 50378823.0, + "step": 21780 + }, + { + "epoch": 0.19977995782524985, + "learning_rate": 0.00016004584211973963, + "loss": 0.8438, + "mean_token_accuracy": 0.7494022369384765, + "num_tokens": 50401408.0, + "step": 21790 + }, + { + "epoch": 0.19987164206472907, + "learning_rate": 0.0001600275052718438, + "loss": 0.8709, + "mean_token_accuracy": 0.7419447243213654, + "num_tokens": 50424655.0, + "step": 21800 + }, + { + "epoch": 0.1999633263042083, + "learning_rate": 0.00016000916842394793, + "loss": 0.8819, + "mean_token_accuracy": 0.7361635088920593, + "num_tokens": 50448104.0, + "step": 21810 + }, + { + "epoch": 0.20005501054368754, + "learning_rate": 0.00015999083157605207, + "loss": 0.8324, + "mean_token_accuracy": 0.7455726146697998, + "num_tokens": 50471452.0, + "step": 21820 + }, + { + "epoch": 0.20014669478316677, + "learning_rate": 0.00015997249472815623, + "loss": 0.8786, + "mean_token_accuracy": 0.7404028177261353, + "num_tokens": 50494949.0, + "step": 21830 + }, + { + "epoch": 0.20023837902264602, + "learning_rate": 0.00015995415788026037, + "loss": 0.8469, + "mean_token_accuracy": 0.7435766935348511, + "num_tokens": 50518380.0, + "step": 21840 + }, + { + "epoch": 0.20033006326212524, + "learning_rate": 0.00015993582103236456, + "loss": 0.8832, + "mean_token_accuracy": 0.7396993160247802, + "num_tokens": 50541556.0, + "step": 21850 + }, + { + "epoch": 0.20042174750160446, + "learning_rate": 0.0001599174841844687, + "loss": 0.8682, + "mean_token_accuracy": 0.7403628826141357, + "num_tokens": 50565156.0, + "step": 21860 + }, + { + "epoch": 0.20051343174108371, + "learning_rate": 0.00015989914733657284, + "loss": 0.808, + "mean_token_accuracy": 0.7503013730049133, + "num_tokens": 50588472.0, + "step": 21870 + }, + { + "epoch": 0.20060511598056294, + "learning_rate": 0.000159880810488677, + "loss": 0.8249, + "mean_token_accuracy": 0.7554940998554229, + "num_tokens": 50611909.0, + "step": 21880 + }, + { + "epoch": 0.2006968002200422, + "learning_rate": 0.00015986247364078115, + "loss": 0.8751, + "mean_token_accuracy": 0.7415297389030456, + "num_tokens": 50635149.0, + "step": 21890 + }, + { + "epoch": 0.2007884844595214, + "learning_rate": 0.0001598441367928853, + "loss": 0.854, + "mean_token_accuracy": 0.7425120592117309, + "num_tokens": 50658808.0, + "step": 21900 + }, + { + "epoch": 0.20088016869900063, + "learning_rate": 0.00015982579994498948, + "loss": 0.883, + "mean_token_accuracy": 0.7333277583122253, + "num_tokens": 50682479.0, + "step": 21910 + }, + { + "epoch": 0.20097185293847988, + "learning_rate": 0.00015980746309709361, + "loss": 0.8342, + "mean_token_accuracy": 0.7389296174049378, + "num_tokens": 50705643.0, + "step": 21920 + }, + { + "epoch": 0.2010635371779591, + "learning_rate": 0.00015978912624919778, + "loss": 0.8686, + "mean_token_accuracy": 0.7412992298603058, + "num_tokens": 50729130.0, + "step": 21930 + }, + { + "epoch": 0.20115522141743833, + "learning_rate": 0.00015977078940130192, + "loss": 0.8876, + "mean_token_accuracy": 0.7428201913833619, + "num_tokens": 50752283.0, + "step": 21940 + }, + { + "epoch": 0.20124690565691758, + "learning_rate": 0.00015975245255340608, + "loss": 0.8699, + "mean_token_accuracy": 0.7395201802253724, + "num_tokens": 50775140.0, + "step": 21950 + }, + { + "epoch": 0.2013385898963968, + "learning_rate": 0.00015973411570551022, + "loss": 0.8461, + "mean_token_accuracy": 0.7436147034168243, + "num_tokens": 50798527.0, + "step": 21960 + }, + { + "epoch": 0.20143027413587605, + "learning_rate": 0.00015971577885761436, + "loss": 0.8824, + "mean_token_accuracy": 0.7316768348217011, + "num_tokens": 50821745.0, + "step": 21970 + }, + { + "epoch": 0.20152195837535528, + "learning_rate": 0.00015969744200971855, + "loss": 0.8418, + "mean_token_accuracy": 0.7444996953010559, + "num_tokens": 50844569.0, + "step": 21980 + }, + { + "epoch": 0.2016136426148345, + "learning_rate": 0.0001596791051618227, + "loss": 0.8546, + "mean_token_accuracy": 0.7404028832912445, + "num_tokens": 50866994.0, + "step": 21990 + }, + { + "epoch": 0.20170532685431375, + "learning_rate": 0.00015966076831392686, + "loss": 0.8609, + "mean_token_accuracy": 0.7448885262012481, + "num_tokens": 50890498.0, + "step": 22000 + }, + { + "epoch": 0.20179701109379297, + "learning_rate": 0.000159642431466031, + "loss": 0.8859, + "mean_token_accuracy": 0.7408232808113098, + "num_tokens": 50913991.0, + "step": 22010 + }, + { + "epoch": 0.20188869533327222, + "learning_rate": 0.00015962409461813513, + "loss": 0.8137, + "mean_token_accuracy": 0.7524222314357758, + "num_tokens": 50936393.0, + "step": 22020 + }, + { + "epoch": 0.20198037957275145, + "learning_rate": 0.0001596057577702393, + "loss": 0.843, + "mean_token_accuracy": 0.7503765940666198, + "num_tokens": 50959777.0, + "step": 22030 + }, + { + "epoch": 0.20207206381223067, + "learning_rate": 0.00015958742092234346, + "loss": 0.8863, + "mean_token_accuracy": 0.7385656297206878, + "num_tokens": 50982461.0, + "step": 22040 + }, + { + "epoch": 0.20216374805170992, + "learning_rate": 0.00015956908407444763, + "loss": 0.8567, + "mean_token_accuracy": 0.7457262992858886, + "num_tokens": 51005599.0, + "step": 22050 + }, + { + "epoch": 0.20225543229118914, + "learning_rate": 0.00015955074722655177, + "loss": 0.8588, + "mean_token_accuracy": 0.7431886255741119, + "num_tokens": 51027794.0, + "step": 22060 + }, + { + "epoch": 0.2023471165306684, + "learning_rate": 0.0001595324103786559, + "loss": 0.8501, + "mean_token_accuracy": 0.7480876386165619, + "num_tokens": 51050893.0, + "step": 22070 + }, + { + "epoch": 0.20243880077014761, + "learning_rate": 0.00015951407353076007, + "loss": 0.902, + "mean_token_accuracy": 0.7377268075942993, + "num_tokens": 51074288.0, + "step": 22080 + }, + { + "epoch": 0.20253048500962684, + "learning_rate": 0.0001594957366828642, + "loss": 0.8679, + "mean_token_accuracy": 0.7407731413841248, + "num_tokens": 51097035.0, + "step": 22090 + }, + { + "epoch": 0.2026221692491061, + "learning_rate": 0.00015947739983496838, + "loss": 0.8568, + "mean_token_accuracy": 0.7497326552867889, + "num_tokens": 51120737.0, + "step": 22100 + }, + { + "epoch": 0.2027138534885853, + "learning_rate": 0.00015945906298707254, + "loss": 0.8569, + "mean_token_accuracy": 0.749122929573059, + "num_tokens": 51143780.0, + "step": 22110 + }, + { + "epoch": 0.20280553772806453, + "learning_rate": 0.00015944072613917668, + "loss": 0.8325, + "mean_token_accuracy": 0.744272917509079, + "num_tokens": 51166455.0, + "step": 22120 + }, + { + "epoch": 0.20289722196754378, + "learning_rate": 0.00015942238929128084, + "loss": 0.8636, + "mean_token_accuracy": 0.7408117949962616, + "num_tokens": 51189569.0, + "step": 22130 + }, + { + "epoch": 0.202988906207023, + "learning_rate": 0.00015940405244338498, + "loss": 0.866, + "mean_token_accuracy": 0.7365211248397827, + "num_tokens": 51212350.0, + "step": 22140 + }, + { + "epoch": 0.20308059044650226, + "learning_rate": 0.00015938571559548915, + "loss": 0.8369, + "mean_token_accuracy": 0.7488377571105957, + "num_tokens": 51235842.0, + "step": 22150 + }, + { + "epoch": 0.20317227468598148, + "learning_rate": 0.00015936737874759329, + "loss": 0.8661, + "mean_token_accuracy": 0.7402497053146362, + "num_tokens": 51259259.0, + "step": 22160 + }, + { + "epoch": 0.2032639589254607, + "learning_rate": 0.00015934904189969745, + "loss": 0.845, + "mean_token_accuracy": 0.7476921737194061, + "num_tokens": 51282364.0, + "step": 22170 + }, + { + "epoch": 0.20335564316493995, + "learning_rate": 0.00015933070505180162, + "loss": 0.8867, + "mean_token_accuracy": 0.7382035672664642, + "num_tokens": 51305531.0, + "step": 22180 + }, + { + "epoch": 0.20344732740441918, + "learning_rate": 0.00015931236820390576, + "loss": 0.8485, + "mean_token_accuracy": 0.7433157622814178, + "num_tokens": 51329112.0, + "step": 22190 + }, + { + "epoch": 0.20353901164389843, + "learning_rate": 0.00015929403135600992, + "loss": 0.8683, + "mean_token_accuracy": 0.7413956165313721, + "num_tokens": 51351873.0, + "step": 22200 + }, + { + "epoch": 0.20363069588337765, + "learning_rate": 0.00015927569450811406, + "loss": 0.8801, + "mean_token_accuracy": 0.7334484934806824, + "num_tokens": 51375100.0, + "step": 22210 + }, + { + "epoch": 0.20372238012285687, + "learning_rate": 0.0001592573576602182, + "loss": 0.836, + "mean_token_accuracy": 0.7457320809364318, + "num_tokens": 51398266.0, + "step": 22220 + }, + { + "epoch": 0.20381406436233612, + "learning_rate": 0.00015923902081232236, + "loss": 0.848, + "mean_token_accuracy": 0.7472280204296112, + "num_tokens": 51421399.0, + "step": 22230 + }, + { + "epoch": 0.20390574860181535, + "learning_rate": 0.00015922068396442653, + "loss": 0.8668, + "mean_token_accuracy": 0.7409771323204041, + "num_tokens": 51444216.0, + "step": 22240 + }, + { + "epoch": 0.20399743284129457, + "learning_rate": 0.0001592023471165307, + "loss": 0.8599, + "mean_token_accuracy": 0.7456480145454407, + "num_tokens": 51467897.0, + "step": 22250 + }, + { + "epoch": 0.20408911708077382, + "learning_rate": 0.00015918401026863483, + "loss": 0.9041, + "mean_token_accuracy": 0.7344803214073181, + "num_tokens": 51491731.0, + "step": 22260 + }, + { + "epoch": 0.20418080132025304, + "learning_rate": 0.00015916567342073897, + "loss": 0.8589, + "mean_token_accuracy": 0.7416087329387665, + "num_tokens": 51514964.0, + "step": 22270 + }, + { + "epoch": 0.2042724855597323, + "learning_rate": 0.00015914733657284314, + "loss": 0.8465, + "mean_token_accuracy": 0.7430679261684418, + "num_tokens": 51538211.0, + "step": 22280 + }, + { + "epoch": 0.20436416979921151, + "learning_rate": 0.00015912899972494727, + "loss": 0.8652, + "mean_token_accuracy": 0.7441716909408569, + "num_tokens": 51561928.0, + "step": 22290 + }, + { + "epoch": 0.20445585403869074, + "learning_rate": 0.00015911066287705144, + "loss": 0.8686, + "mean_token_accuracy": 0.7427517771720886, + "num_tokens": 51584876.0, + "step": 22300 + }, + { + "epoch": 0.20454753827817, + "learning_rate": 0.0001590923260291556, + "loss": 0.8532, + "mean_token_accuracy": 0.7431596398353577, + "num_tokens": 51607025.0, + "step": 22310 + }, + { + "epoch": 0.2046392225176492, + "learning_rate": 0.00015907398918125974, + "loss": 0.8465, + "mean_token_accuracy": 0.7427390575408935, + "num_tokens": 51630064.0, + "step": 22320 + }, + { + "epoch": 0.20473090675712846, + "learning_rate": 0.0001590556523333639, + "loss": 0.8438, + "mean_token_accuracy": 0.7487075865268707, + "num_tokens": 51653929.0, + "step": 22330 + }, + { + "epoch": 0.20482259099660768, + "learning_rate": 0.00015903731548546805, + "loss": 0.8777, + "mean_token_accuracy": 0.7471191346645355, + "num_tokens": 51677171.0, + "step": 22340 + }, + { + "epoch": 0.2049142752360869, + "learning_rate": 0.0001590189786375722, + "loss": 0.8467, + "mean_token_accuracy": 0.7524676620960236, + "num_tokens": 51699778.0, + "step": 22350 + }, + { + "epoch": 0.20500595947556616, + "learning_rate": 0.00015900064178967635, + "loss": 0.8833, + "mean_token_accuracy": 0.7445943593978882, + "num_tokens": 51722784.0, + "step": 22360 + }, + { + "epoch": 0.20509764371504538, + "learning_rate": 0.00015898230494178052, + "loss": 0.8436, + "mean_token_accuracy": 0.7526306509971619, + "num_tokens": 51744504.0, + "step": 22370 + }, + { + "epoch": 0.20518932795452463, + "learning_rate": 0.00015896396809388468, + "loss": 0.8334, + "mean_token_accuracy": 0.7482061982154846, + "num_tokens": 51768151.0, + "step": 22380 + }, + { + "epoch": 0.20528101219400385, + "learning_rate": 0.00015894563124598882, + "loss": 0.8553, + "mean_token_accuracy": 0.746174567937851, + "num_tokens": 51790906.0, + "step": 22390 + }, + { + "epoch": 0.20537269643348308, + "learning_rate": 0.00015892729439809299, + "loss": 0.8952, + "mean_token_accuracy": 0.7336604475975037, + "num_tokens": 51813564.0, + "step": 22400 + }, + { + "epoch": 0.20546438067296233, + "learning_rate": 0.00015890895755019712, + "loss": 0.8645, + "mean_token_accuracy": 0.7384875535964965, + "num_tokens": 51836941.0, + "step": 22410 + }, + { + "epoch": 0.20555606491244155, + "learning_rate": 0.00015889062070230126, + "loss": 0.8725, + "mean_token_accuracy": 0.7424970269203186, + "num_tokens": 51859858.0, + "step": 22420 + }, + { + "epoch": 0.20564774915192077, + "learning_rate": 0.00015887228385440545, + "loss": 0.8631, + "mean_token_accuracy": 0.7439145982265473, + "num_tokens": 51883311.0, + "step": 22430 + }, + { + "epoch": 0.20573943339140002, + "learning_rate": 0.0001588539470065096, + "loss": 0.8685, + "mean_token_accuracy": 0.7378161787986756, + "num_tokens": 51906335.0, + "step": 22440 + }, + { + "epoch": 0.20583111763087925, + "learning_rate": 0.00015883561015861376, + "loss": 0.8401, + "mean_token_accuracy": 0.7537043929100037, + "num_tokens": 51930121.0, + "step": 22450 + }, + { + "epoch": 0.2059228018703585, + "learning_rate": 0.0001588172733107179, + "loss": 0.8656, + "mean_token_accuracy": 0.7449964284896851, + "num_tokens": 51952639.0, + "step": 22460 + }, + { + "epoch": 0.20601448610983772, + "learning_rate": 0.00015879893646282203, + "loss": 0.8344, + "mean_token_accuracy": 0.7512423753738403, + "num_tokens": 51975722.0, + "step": 22470 + }, + { + "epoch": 0.20610617034931694, + "learning_rate": 0.0001587805996149262, + "loss": 0.8424, + "mean_token_accuracy": 0.7491206347942352, + "num_tokens": 51998867.0, + "step": 22480 + }, + { + "epoch": 0.2061978545887962, + "learning_rate": 0.00015876226276703034, + "loss": 0.8375, + "mean_token_accuracy": 0.7521736443042755, + "num_tokens": 52022136.0, + "step": 22490 + }, + { + "epoch": 0.20628953882827541, + "learning_rate": 0.0001587439259191345, + "loss": 0.8272, + "mean_token_accuracy": 0.7509084165096283, + "num_tokens": 52045455.0, + "step": 22500 + }, + { + "epoch": 0.20638122306775467, + "learning_rate": 0.00015872558907123867, + "loss": 0.8828, + "mean_token_accuracy": 0.7422175109386444, + "num_tokens": 52069071.0, + "step": 22510 + }, + { + "epoch": 0.2064729073072339, + "learning_rate": 0.0001587072522233428, + "loss": 0.8857, + "mean_token_accuracy": 0.734280240535736, + "num_tokens": 52092525.0, + "step": 22520 + }, + { + "epoch": 0.2065645915467131, + "learning_rate": 0.00015868891537544697, + "loss": 0.8607, + "mean_token_accuracy": 0.746072632074356, + "num_tokens": 52115754.0, + "step": 22530 + }, + { + "epoch": 0.20665627578619236, + "learning_rate": 0.0001586705785275511, + "loss": 0.9128, + "mean_token_accuracy": 0.7358653903007507, + "num_tokens": 52138986.0, + "step": 22540 + }, + { + "epoch": 0.20674796002567158, + "learning_rate": 0.00015865224167965528, + "loss": 0.8529, + "mean_token_accuracy": 0.743468987941742, + "num_tokens": 52161991.0, + "step": 22550 + }, + { + "epoch": 0.2068396442651508, + "learning_rate": 0.00015863390483175944, + "loss": 0.868, + "mean_token_accuracy": 0.7468756318092347, + "num_tokens": 52185451.0, + "step": 22560 + }, + { + "epoch": 0.20693132850463006, + "learning_rate": 0.00015861556798386358, + "loss": 0.8723, + "mean_token_accuracy": 0.7450823128223419, + "num_tokens": 52208249.0, + "step": 22570 + }, + { + "epoch": 0.20702301274410928, + "learning_rate": 0.00015859723113596775, + "loss": 0.8629, + "mean_token_accuracy": 0.7449024319648743, + "num_tokens": 52231571.0, + "step": 22580 + }, + { + "epoch": 0.20711469698358853, + "learning_rate": 0.00015857889428807188, + "loss": 0.8236, + "mean_token_accuracy": 0.7532026469707489, + "num_tokens": 52254458.0, + "step": 22590 + }, + { + "epoch": 0.20720638122306775, + "learning_rate": 0.00015856055744017605, + "loss": 0.8853, + "mean_token_accuracy": 0.7419590651988983, + "num_tokens": 52277353.0, + "step": 22600 + }, + { + "epoch": 0.20729806546254698, + "learning_rate": 0.0001585422205922802, + "loss": 0.8797, + "mean_token_accuracy": 0.7334124922752381, + "num_tokens": 52300646.0, + "step": 22610 + }, + { + "epoch": 0.20738974970202623, + "learning_rate": 0.00015852388374438433, + "loss": 0.8706, + "mean_token_accuracy": 0.741769301891327, + "num_tokens": 52323640.0, + "step": 22620 + }, + { + "epoch": 0.20748143394150545, + "learning_rate": 0.00015850554689648852, + "loss": 0.8591, + "mean_token_accuracy": 0.7348312199115753, + "num_tokens": 52347076.0, + "step": 22630 + }, + { + "epoch": 0.2075731181809847, + "learning_rate": 0.00015848721004859266, + "loss": 0.8921, + "mean_token_accuracy": 0.7361427903175354, + "num_tokens": 52370014.0, + "step": 22640 + }, + { + "epoch": 0.20766480242046392, + "learning_rate": 0.00015846887320069682, + "loss": 0.8396, + "mean_token_accuracy": 0.7475686013698578, + "num_tokens": 52393061.0, + "step": 22650 + }, + { + "epoch": 0.20775648665994315, + "learning_rate": 0.00015845053635280096, + "loss": 0.8745, + "mean_token_accuracy": 0.7397183537483215, + "num_tokens": 52415796.0, + "step": 22660 + }, + { + "epoch": 0.2078481708994224, + "learning_rate": 0.0001584321995049051, + "loss": 0.8597, + "mean_token_accuracy": 0.7469383776187897, + "num_tokens": 52438316.0, + "step": 22670 + }, + { + "epoch": 0.20793985513890162, + "learning_rate": 0.00015841386265700926, + "loss": 0.8568, + "mean_token_accuracy": 0.7485611915588379, + "num_tokens": 52462059.0, + "step": 22680 + }, + { + "epoch": 0.20803153937838087, + "learning_rate": 0.00015839552580911343, + "loss": 0.8955, + "mean_token_accuracy": 0.7418225705623627, + "num_tokens": 52484563.0, + "step": 22690 + }, + { + "epoch": 0.2081232236178601, + "learning_rate": 0.00015837718896121757, + "loss": 0.896, + "mean_token_accuracy": 0.732795125246048, + "num_tokens": 52507688.0, + "step": 22700 + }, + { + "epoch": 0.20821490785733932, + "learning_rate": 0.00015835885211332173, + "loss": 0.8542, + "mean_token_accuracy": 0.7425751388072968, + "num_tokens": 52531415.0, + "step": 22710 + }, + { + "epoch": 0.20830659209681857, + "learning_rate": 0.00015834051526542587, + "loss": 0.8711, + "mean_token_accuracy": 0.7430127382278442, + "num_tokens": 52554075.0, + "step": 22720 + }, + { + "epoch": 0.2083982763362978, + "learning_rate": 0.00015832217841753004, + "loss": 0.8284, + "mean_token_accuracy": 0.74892458319664, + "num_tokens": 52576818.0, + "step": 22730 + }, + { + "epoch": 0.208489960575777, + "learning_rate": 0.00015830384156963418, + "loss": 0.8636, + "mean_token_accuracy": 0.7368107259273529, + "num_tokens": 52600359.0, + "step": 22740 + }, + { + "epoch": 0.20858164481525626, + "learning_rate": 0.00015828550472173834, + "loss": 0.8554, + "mean_token_accuracy": 0.7400186717510223, + "num_tokens": 52624016.0, + "step": 22750 + }, + { + "epoch": 0.20867332905473548, + "learning_rate": 0.0001582671678738425, + "loss": 0.8558, + "mean_token_accuracy": 0.7459397435188293, + "num_tokens": 52647758.0, + "step": 22760 + }, + { + "epoch": 0.20876501329421474, + "learning_rate": 0.00015824883102594665, + "loss": 0.8173, + "mean_token_accuracy": 0.7541181325912476, + "num_tokens": 52670209.0, + "step": 22770 + }, + { + "epoch": 0.20885669753369396, + "learning_rate": 0.0001582304941780508, + "loss": 0.8528, + "mean_token_accuracy": 0.7441991806030274, + "num_tokens": 52693886.0, + "step": 22780 + }, + { + "epoch": 0.20894838177317318, + "learning_rate": 0.00015821215733015495, + "loss": 0.8656, + "mean_token_accuracy": 0.7385231554508209, + "num_tokens": 52717927.0, + "step": 22790 + }, + { + "epoch": 0.20904006601265243, + "learning_rate": 0.00015819382048225911, + "loss": 0.8811, + "mean_token_accuracy": 0.7368879735469818, + "num_tokens": 52740786.0, + "step": 22800 + }, + { + "epoch": 0.20913175025213165, + "learning_rate": 0.00015817548363436325, + "loss": 0.8763, + "mean_token_accuracy": 0.7419000327587127, + "num_tokens": 52764240.0, + "step": 22810 + }, + { + "epoch": 0.2092234344916109, + "learning_rate": 0.0001581571467864674, + "loss": 0.8755, + "mean_token_accuracy": 0.7437607824802399, + "num_tokens": 52787198.0, + "step": 22820 + }, + { + "epoch": 0.20931511873109013, + "learning_rate": 0.00015813880993857158, + "loss": 0.8601, + "mean_token_accuracy": 0.7427997291088104, + "num_tokens": 52810972.0, + "step": 22830 + }, + { + "epoch": 0.20940680297056935, + "learning_rate": 0.00015812047309067572, + "loss": 0.825, + "mean_token_accuracy": 0.7468115806579589, + "num_tokens": 52833364.0, + "step": 22840 + }, + { + "epoch": 0.2094984872100486, + "learning_rate": 0.0001581021362427799, + "loss": 0.8593, + "mean_token_accuracy": 0.7529172241687775, + "num_tokens": 52856738.0, + "step": 22850 + }, + { + "epoch": 0.20959017144952782, + "learning_rate": 0.00015808379939488403, + "loss": 0.8411, + "mean_token_accuracy": 0.7520411849021912, + "num_tokens": 52879726.0, + "step": 22860 + }, + { + "epoch": 0.20968185568900705, + "learning_rate": 0.00015806546254698816, + "loss": 0.8556, + "mean_token_accuracy": 0.7454691350460052, + "num_tokens": 52903323.0, + "step": 22870 + }, + { + "epoch": 0.2097735399284863, + "learning_rate": 0.00015804712569909233, + "loss": 0.8305, + "mean_token_accuracy": 0.7444688558578492, + "num_tokens": 52927232.0, + "step": 22880 + }, + { + "epoch": 0.20986522416796552, + "learning_rate": 0.0001580287888511965, + "loss": 0.8174, + "mean_token_accuracy": 0.751531845331192, + "num_tokens": 52950700.0, + "step": 22890 + }, + { + "epoch": 0.20995690840744477, + "learning_rate": 0.00015801045200330063, + "loss": 0.8397, + "mean_token_accuracy": 0.7518243432044983, + "num_tokens": 52973978.0, + "step": 22900 + }, + { + "epoch": 0.210048592646924, + "learning_rate": 0.0001579921151554048, + "loss": 0.826, + "mean_token_accuracy": 0.7524587571620941, + "num_tokens": 52996751.0, + "step": 22910 + }, + { + "epoch": 0.21014027688640322, + "learning_rate": 0.00015797377830750894, + "loss": 0.8327, + "mean_token_accuracy": 0.7447079837322235, + "num_tokens": 53020346.0, + "step": 22920 + }, + { + "epoch": 0.21023196112588247, + "learning_rate": 0.0001579554414596131, + "loss": 0.8493, + "mean_token_accuracy": 0.7439808189868927, + "num_tokens": 53043552.0, + "step": 22930 + }, + { + "epoch": 0.2103236453653617, + "learning_rate": 0.00015793710461171724, + "loss": 0.8561, + "mean_token_accuracy": 0.7447343707084656, + "num_tokens": 53066439.0, + "step": 22940 + }, + { + "epoch": 0.21041532960484094, + "learning_rate": 0.0001579187677638214, + "loss": 0.8901, + "mean_token_accuracy": 0.7344002246856689, + "num_tokens": 53089696.0, + "step": 22950 + }, + { + "epoch": 0.21050701384432016, + "learning_rate": 0.00015790043091592557, + "loss": 0.8451, + "mean_token_accuracy": 0.7429101884365081, + "num_tokens": 53112911.0, + "step": 22960 + }, + { + "epoch": 0.21059869808379938, + "learning_rate": 0.0001578820940680297, + "loss": 0.887, + "mean_token_accuracy": 0.7421387135982513, + "num_tokens": 53136508.0, + "step": 22970 + }, + { + "epoch": 0.21069038232327864, + "learning_rate": 0.00015786375722013388, + "loss": 0.8485, + "mean_token_accuracy": 0.7438655614852905, + "num_tokens": 53159562.0, + "step": 22980 + }, + { + "epoch": 0.21078206656275786, + "learning_rate": 0.000157845420372238, + "loss": 0.8742, + "mean_token_accuracy": 0.738437169790268, + "num_tokens": 53182338.0, + "step": 22990 + }, + { + "epoch": 0.2108737508022371, + "learning_rate": 0.00015782708352434218, + "loss": 0.8638, + "mean_token_accuracy": 0.7404647469520569, + "num_tokens": 53205760.0, + "step": 23000 + }, + { + "epoch": 0.21096543504171633, + "learning_rate": 0.00015780874667644632, + "loss": 0.8652, + "mean_token_accuracy": 0.7402274906635284, + "num_tokens": 53229103.0, + "step": 23010 + }, + { + "epoch": 0.21105711928119555, + "learning_rate": 0.00015779040982855048, + "loss": 0.8204, + "mean_token_accuracy": 0.751193743944168, + "num_tokens": 53252856.0, + "step": 23020 + }, + { + "epoch": 0.2111488035206748, + "learning_rate": 0.00015777207298065465, + "loss": 0.8431, + "mean_token_accuracy": 0.7468126237392425, + "num_tokens": 53276558.0, + "step": 23030 + }, + { + "epoch": 0.21124048776015403, + "learning_rate": 0.00015775373613275879, + "loss": 0.8539, + "mean_token_accuracy": 0.7457605421543121, + "num_tokens": 53299878.0, + "step": 23040 + }, + { + "epoch": 0.21133217199963325, + "learning_rate": 0.00015773539928486295, + "loss": 0.8882, + "mean_token_accuracy": 0.7381194353103637, + "num_tokens": 53322991.0, + "step": 23050 + }, + { + "epoch": 0.2114238562391125, + "learning_rate": 0.0001577170624369671, + "loss": 0.8492, + "mean_token_accuracy": 0.7466514110565186, + "num_tokens": 53346031.0, + "step": 23060 + }, + { + "epoch": 0.21151554047859172, + "learning_rate": 0.00015769872558907123, + "loss": 0.8339, + "mean_token_accuracy": 0.748447859287262, + "num_tokens": 53368430.0, + "step": 23070 + }, + { + "epoch": 0.21160722471807097, + "learning_rate": 0.0001576803887411754, + "loss": 0.8542, + "mean_token_accuracy": 0.7409026741981506, + "num_tokens": 53391918.0, + "step": 23080 + }, + { + "epoch": 0.2116989089575502, + "learning_rate": 0.00015766205189327956, + "loss": 0.8305, + "mean_token_accuracy": 0.7559028267860413, + "num_tokens": 53413879.0, + "step": 23090 + }, + { + "epoch": 0.21179059319702942, + "learning_rate": 0.0001576437150453837, + "loss": 0.8745, + "mean_token_accuracy": 0.7381623983383179, + "num_tokens": 53437667.0, + "step": 23100 + }, + { + "epoch": 0.21188227743650867, + "learning_rate": 0.00015762537819748786, + "loss": 0.7952, + "mean_token_accuracy": 0.7536631882190704, + "num_tokens": 53461367.0, + "step": 23110 + }, + { + "epoch": 0.2119739616759879, + "learning_rate": 0.000157607041349592, + "loss": 0.8783, + "mean_token_accuracy": 0.7351391434669494, + "num_tokens": 53483854.0, + "step": 23120 + }, + { + "epoch": 0.21206564591546714, + "learning_rate": 0.00015758870450169617, + "loss": 0.8452, + "mean_token_accuracy": 0.7492637693881988, + "num_tokens": 53506978.0, + "step": 23130 + }, + { + "epoch": 0.21215733015494637, + "learning_rate": 0.0001575703676538003, + "loss": 0.8812, + "mean_token_accuracy": 0.7430793285369873, + "num_tokens": 53529964.0, + "step": 23140 + }, + { + "epoch": 0.2122490143944256, + "learning_rate": 0.00015755203080590447, + "loss": 0.8998, + "mean_token_accuracy": 0.734472805261612, + "num_tokens": 53553476.0, + "step": 23150 + }, + { + "epoch": 0.21234069863390484, + "learning_rate": 0.00015753369395800864, + "loss": 0.9035, + "mean_token_accuracy": 0.7372500181198121, + "num_tokens": 53576958.0, + "step": 23160 + }, + { + "epoch": 0.21243238287338406, + "learning_rate": 0.00015751535711011277, + "loss": 0.8651, + "mean_token_accuracy": 0.7355253279209137, + "num_tokens": 53599662.0, + "step": 23170 + }, + { + "epoch": 0.21252406711286329, + "learning_rate": 0.00015749702026221694, + "loss": 0.8762, + "mean_token_accuracy": 0.7412170886993408, + "num_tokens": 53622289.0, + "step": 23180 + }, + { + "epoch": 0.21261575135234254, + "learning_rate": 0.00015747868341432108, + "loss": 0.818, + "mean_token_accuracy": 0.7529448926448822, + "num_tokens": 53646308.0, + "step": 23190 + }, + { + "epoch": 0.21270743559182176, + "learning_rate": 0.00015746034656642524, + "loss": 0.8986, + "mean_token_accuracy": 0.7288304030895233, + "num_tokens": 53669551.0, + "step": 23200 + }, + { + "epoch": 0.212799119831301, + "learning_rate": 0.00015744200971852938, + "loss": 0.8444, + "mean_token_accuracy": 0.7498817265033721, + "num_tokens": 53693088.0, + "step": 23210 + }, + { + "epoch": 0.21289080407078023, + "learning_rate": 0.00015742367287063355, + "loss": 0.8121, + "mean_token_accuracy": 0.7579306125640869, + "num_tokens": 53715872.0, + "step": 23220 + }, + { + "epoch": 0.21298248831025945, + "learning_rate": 0.0001574053360227377, + "loss": 0.9312, + "mean_token_accuracy": 0.7323280274868011, + "num_tokens": 53739238.0, + "step": 23230 + }, + { + "epoch": 0.2130741725497387, + "learning_rate": 0.00015738699917484185, + "loss": 0.8538, + "mean_token_accuracy": 0.7449313700199127, + "num_tokens": 53762212.0, + "step": 23240 + }, + { + "epoch": 0.21316585678921793, + "learning_rate": 0.00015736866232694602, + "loss": 0.8477, + "mean_token_accuracy": 0.7526765108108521, + "num_tokens": 53785291.0, + "step": 23250 + }, + { + "epoch": 0.21325754102869718, + "learning_rate": 0.00015735032547905015, + "loss": 0.8426, + "mean_token_accuracy": 0.7461187839508057, + "num_tokens": 53807700.0, + "step": 23260 + }, + { + "epoch": 0.2133492252681764, + "learning_rate": 0.0001573319886311543, + "loss": 0.8775, + "mean_token_accuracy": 0.7434069573879242, + "num_tokens": 53830824.0, + "step": 23270 + }, + { + "epoch": 0.21344090950765562, + "learning_rate": 0.00015731365178325849, + "loss": 0.9066, + "mean_token_accuracy": 0.7361610054969787, + "num_tokens": 53855212.0, + "step": 23280 + }, + { + "epoch": 0.21353259374713487, + "learning_rate": 0.00015729531493536262, + "loss": 0.8844, + "mean_token_accuracy": 0.7391054093837738, + "num_tokens": 53877991.0, + "step": 23290 + }, + { + "epoch": 0.2136242779866141, + "learning_rate": 0.00015727697808746676, + "loss": 0.8158, + "mean_token_accuracy": 0.7555877804756165, + "num_tokens": 53900944.0, + "step": 23300 + }, + { + "epoch": 0.21371596222609335, + "learning_rate": 0.00015725864123957093, + "loss": 0.8358, + "mean_token_accuracy": 0.7458467245101928, + "num_tokens": 53923949.0, + "step": 23310 + }, + { + "epoch": 0.21380764646557257, + "learning_rate": 0.00015724030439167507, + "loss": 0.8638, + "mean_token_accuracy": 0.7416692852973938, + "num_tokens": 53946905.0, + "step": 23320 + }, + { + "epoch": 0.2138993307050518, + "learning_rate": 0.00015722196754377923, + "loss": 0.8507, + "mean_token_accuracy": 0.7485923886299133, + "num_tokens": 53969557.0, + "step": 23330 + }, + { + "epoch": 0.21399101494453104, + "learning_rate": 0.00015720363069588337, + "loss": 0.8635, + "mean_token_accuracy": 0.7405233025550843, + "num_tokens": 53993251.0, + "step": 23340 + }, + { + "epoch": 0.21408269918401027, + "learning_rate": 0.00015718529384798753, + "loss": 0.8375, + "mean_token_accuracy": 0.7482027769088745, + "num_tokens": 54016482.0, + "step": 23350 + }, + { + "epoch": 0.2141743834234895, + "learning_rate": 0.0001571669570000917, + "loss": 0.8301, + "mean_token_accuracy": 0.7466087222099305, + "num_tokens": 54039231.0, + "step": 23360 + }, + { + "epoch": 0.21426606766296874, + "learning_rate": 0.00015714862015219584, + "loss": 0.8649, + "mean_token_accuracy": 0.7439805567264557, + "num_tokens": 54062281.0, + "step": 23370 + }, + { + "epoch": 0.21435775190244796, + "learning_rate": 0.0001571302833043, + "loss": 0.8523, + "mean_token_accuracy": 0.7457484066486358, + "num_tokens": 54085035.0, + "step": 23380 + }, + { + "epoch": 0.2144494361419272, + "learning_rate": 0.00015711194645640414, + "loss": 0.8878, + "mean_token_accuracy": 0.7381054818630218, + "num_tokens": 54108892.0, + "step": 23390 + }, + { + "epoch": 0.21454112038140644, + "learning_rate": 0.0001570936096085083, + "loss": 0.873, + "mean_token_accuracy": 0.7365092277526856, + "num_tokens": 54131651.0, + "step": 23400 + }, + { + "epoch": 0.21463280462088566, + "learning_rate": 0.00015707527276061247, + "loss": 0.8684, + "mean_token_accuracy": 0.7431603789329528, + "num_tokens": 54154336.0, + "step": 23410 + }, + { + "epoch": 0.2147244888603649, + "learning_rate": 0.0001570569359127166, + "loss": 0.883, + "mean_token_accuracy": 0.7376543760299683, + "num_tokens": 54177580.0, + "step": 23420 + }, + { + "epoch": 0.21481617309984413, + "learning_rate": 0.00015703859906482078, + "loss": 0.8711, + "mean_token_accuracy": 0.7387879192829132, + "num_tokens": 54201126.0, + "step": 23430 + }, + { + "epoch": 0.21490785733932338, + "learning_rate": 0.00015702026221692492, + "loss": 0.8437, + "mean_token_accuracy": 0.748453801870346, + "num_tokens": 54224885.0, + "step": 23440 + }, + { + "epoch": 0.2149995415788026, + "learning_rate": 0.00015700192536902908, + "loss": 0.8623, + "mean_token_accuracy": 0.7423072993755341, + "num_tokens": 54247480.0, + "step": 23450 + }, + { + "epoch": 0.21509122581828183, + "learning_rate": 0.00015698358852113322, + "loss": 0.8959, + "mean_token_accuracy": 0.7366766691207886, + "num_tokens": 54269692.0, + "step": 23460 + }, + { + "epoch": 0.21518291005776108, + "learning_rate": 0.00015696525167323736, + "loss": 0.8876, + "mean_token_accuracy": 0.737098115682602, + "num_tokens": 54292968.0, + "step": 23470 + }, + { + "epoch": 0.2152745942972403, + "learning_rate": 0.00015694691482534155, + "loss": 0.8866, + "mean_token_accuracy": 0.7405371010303498, + "num_tokens": 54316741.0, + "step": 23480 + }, + { + "epoch": 0.21536627853671952, + "learning_rate": 0.0001569285779774457, + "loss": 0.8566, + "mean_token_accuracy": 0.7423771560192108, + "num_tokens": 54339565.0, + "step": 23490 + }, + { + "epoch": 0.21545796277619877, + "learning_rate": 0.00015691024112954983, + "loss": 0.8331, + "mean_token_accuracy": 0.7455996751785279, + "num_tokens": 54363044.0, + "step": 23500 + }, + { + "epoch": 0.215549647015678, + "learning_rate": 0.000156891904281654, + "loss": 0.8933, + "mean_token_accuracy": 0.7349541306495666, + "num_tokens": 54385937.0, + "step": 23510 + }, + { + "epoch": 0.21564133125515725, + "learning_rate": 0.00015687356743375813, + "loss": 0.8642, + "mean_token_accuracy": 0.7499670505523681, + "num_tokens": 54408753.0, + "step": 23520 + }, + { + "epoch": 0.21573301549463647, + "learning_rate": 0.0001568552305858623, + "loss": 0.8648, + "mean_token_accuracy": 0.7448411345481872, + "num_tokens": 54431866.0, + "step": 23530 + }, + { + "epoch": 0.2158246997341157, + "learning_rate": 0.00015683689373796646, + "loss": 0.8593, + "mean_token_accuracy": 0.747662615776062, + "num_tokens": 54454634.0, + "step": 23540 + }, + { + "epoch": 0.21591638397359494, + "learning_rate": 0.0001568185568900706, + "loss": 0.8698, + "mean_token_accuracy": 0.744737309217453, + "num_tokens": 54477758.0, + "step": 23550 + }, + { + "epoch": 0.21600806821307417, + "learning_rate": 0.00015680022004217476, + "loss": 0.8384, + "mean_token_accuracy": 0.7470738470554352, + "num_tokens": 54501201.0, + "step": 23560 + }, + { + "epoch": 0.21609975245255342, + "learning_rate": 0.0001567818831942789, + "loss": 0.8633, + "mean_token_accuracy": 0.7414463341236115, + "num_tokens": 54524678.0, + "step": 23570 + }, + { + "epoch": 0.21619143669203264, + "learning_rate": 0.00015676354634638307, + "loss": 0.8578, + "mean_token_accuracy": 0.7483405590057373, + "num_tokens": 54547753.0, + "step": 23580 + }, + { + "epoch": 0.21628312093151186, + "learning_rate": 0.0001567452094984872, + "loss": 0.8498, + "mean_token_accuracy": 0.7444630563259125, + "num_tokens": 54570375.0, + "step": 23590 + }, + { + "epoch": 0.2163748051709911, + "learning_rate": 0.00015672687265059137, + "loss": 0.8685, + "mean_token_accuracy": 0.742591780424118, + "num_tokens": 54593404.0, + "step": 23600 + }, + { + "epoch": 0.21646648941047034, + "learning_rate": 0.00015670853580269554, + "loss": 0.857, + "mean_token_accuracy": 0.7420598983764648, + "num_tokens": 54617124.0, + "step": 23610 + }, + { + "epoch": 0.2165581736499496, + "learning_rate": 0.00015669019895479968, + "loss": 0.8402, + "mean_token_accuracy": 0.7527478635311127, + "num_tokens": 54640572.0, + "step": 23620 + }, + { + "epoch": 0.2166498578894288, + "learning_rate": 0.00015667186210690384, + "loss": 0.8273, + "mean_token_accuracy": 0.7498106837272644, + "num_tokens": 54664242.0, + "step": 23630 + }, + { + "epoch": 0.21674154212890803, + "learning_rate": 0.00015665352525900798, + "loss": 0.8275, + "mean_token_accuracy": 0.7492702424526214, + "num_tokens": 54687693.0, + "step": 23640 + }, + { + "epoch": 0.21683322636838728, + "learning_rate": 0.00015663518841111215, + "loss": 0.8802, + "mean_token_accuracy": 0.7409344494342804, + "num_tokens": 54711150.0, + "step": 23650 + }, + { + "epoch": 0.2169249106078665, + "learning_rate": 0.00015661685156321628, + "loss": 0.8867, + "mean_token_accuracy": 0.7304402410984039, + "num_tokens": 54733747.0, + "step": 23660 + }, + { + "epoch": 0.21701659484734573, + "learning_rate": 0.00015659851471532045, + "loss": 0.857, + "mean_token_accuracy": 0.747049993276596, + "num_tokens": 54756418.0, + "step": 23670 + }, + { + "epoch": 0.21710827908682498, + "learning_rate": 0.00015658017786742461, + "loss": 0.8784, + "mean_token_accuracy": 0.7382007956504821, + "num_tokens": 54779656.0, + "step": 23680 + }, + { + "epoch": 0.2171999633263042, + "learning_rate": 0.00015656184101952875, + "loss": 0.89, + "mean_token_accuracy": 0.7308126807212829, + "num_tokens": 54803066.0, + "step": 23690 + }, + { + "epoch": 0.21729164756578345, + "learning_rate": 0.0001565435041716329, + "loss": 0.8903, + "mean_token_accuracy": 0.7373201549053192, + "num_tokens": 54826372.0, + "step": 23700 + }, + { + "epoch": 0.21738333180526268, + "learning_rate": 0.00015652516732373706, + "loss": 0.8808, + "mean_token_accuracy": 0.7408906638622283, + "num_tokens": 54850113.0, + "step": 23710 + }, + { + "epoch": 0.2174750160447419, + "learning_rate": 0.0001565068304758412, + "loss": 0.8341, + "mean_token_accuracy": 0.7525183320045471, + "num_tokens": 54872989.0, + "step": 23720 + }, + { + "epoch": 0.21756670028422115, + "learning_rate": 0.00015648849362794536, + "loss": 0.8593, + "mean_token_accuracy": 0.7476661264896393, + "num_tokens": 54896134.0, + "step": 23730 + }, + { + "epoch": 0.21765838452370037, + "learning_rate": 0.00015647015678004953, + "loss": 0.8484, + "mean_token_accuracy": 0.750644987821579, + "num_tokens": 54918632.0, + "step": 23740 + }, + { + "epoch": 0.21775006876317962, + "learning_rate": 0.00015645181993215366, + "loss": 0.8577, + "mean_token_accuracy": 0.7441705107688904, + "num_tokens": 54941866.0, + "step": 23750 + }, + { + "epoch": 0.21784175300265884, + "learning_rate": 0.00015643348308425783, + "loss": 0.8242, + "mean_token_accuracy": 0.7528449773788453, + "num_tokens": 54964650.0, + "step": 23760 + }, + { + "epoch": 0.21793343724213807, + "learning_rate": 0.00015641514623636197, + "loss": 0.8757, + "mean_token_accuracy": 0.7425302565097809, + "num_tokens": 54987828.0, + "step": 23770 + }, + { + "epoch": 0.21802512148161732, + "learning_rate": 0.00015639680938846613, + "loss": 0.8637, + "mean_token_accuracy": 0.7403858184814454, + "num_tokens": 55011006.0, + "step": 23780 + }, + { + "epoch": 0.21811680572109654, + "learning_rate": 0.00015637847254057027, + "loss": 0.8804, + "mean_token_accuracy": 0.7361753046512604, + "num_tokens": 55033867.0, + "step": 23790 + }, + { + "epoch": 0.21820848996057576, + "learning_rate": 0.00015636013569267444, + "loss": 0.8673, + "mean_token_accuracy": 0.7374181807041168, + "num_tokens": 55057010.0, + "step": 23800 + }, + { + "epoch": 0.218300174200055, + "learning_rate": 0.0001563417988447786, + "loss": 0.8607, + "mean_token_accuracy": 0.7394064128398895, + "num_tokens": 55079738.0, + "step": 23810 + }, + { + "epoch": 0.21839185843953424, + "learning_rate": 0.00015632346199688274, + "loss": 0.8339, + "mean_token_accuracy": 0.7540367722511292, + "num_tokens": 55102910.0, + "step": 23820 + }, + { + "epoch": 0.2184835426790135, + "learning_rate": 0.0001563051251489869, + "loss": 0.8661, + "mean_token_accuracy": 0.7424493491649627, + "num_tokens": 55126616.0, + "step": 23830 + }, + { + "epoch": 0.2185752269184927, + "learning_rate": 0.00015628678830109104, + "loss": 0.8596, + "mean_token_accuracy": 0.7432507991790771, + "num_tokens": 55150326.0, + "step": 23840 + }, + { + "epoch": 0.21866691115797193, + "learning_rate": 0.0001562684514531952, + "loss": 0.8668, + "mean_token_accuracy": 0.7417873263359069, + "num_tokens": 55173701.0, + "step": 23850 + }, + { + "epoch": 0.21875859539745118, + "learning_rate": 0.00015625011460529935, + "loss": 0.8874, + "mean_token_accuracy": 0.7332236111164093, + "num_tokens": 55197126.0, + "step": 23860 + }, + { + "epoch": 0.2188502796369304, + "learning_rate": 0.0001562317777574035, + "loss": 0.8587, + "mean_token_accuracy": 0.7481783926486969, + "num_tokens": 55220566.0, + "step": 23870 + }, + { + "epoch": 0.21894196387640966, + "learning_rate": 0.00015621344090950768, + "loss": 0.8246, + "mean_token_accuracy": 0.7439969122409821, + "num_tokens": 55243504.0, + "step": 23880 + }, + { + "epoch": 0.21903364811588888, + "learning_rate": 0.00015619510406161182, + "loss": 0.8057, + "mean_token_accuracy": 0.7523382008075714, + "num_tokens": 55267123.0, + "step": 23890 + }, + { + "epoch": 0.2191253323553681, + "learning_rate": 0.00015617676721371596, + "loss": 0.8726, + "mean_token_accuracy": 0.7446614146232605, + "num_tokens": 55291060.0, + "step": 23900 + }, + { + "epoch": 0.21921701659484735, + "learning_rate": 0.00015615843036582012, + "loss": 0.89, + "mean_token_accuracy": 0.7387046813964844, + "num_tokens": 55314005.0, + "step": 23910 + }, + { + "epoch": 0.21930870083432658, + "learning_rate": 0.00015614009351792426, + "loss": 0.8486, + "mean_token_accuracy": 0.7483787298202514, + "num_tokens": 55336522.0, + "step": 23920 + }, + { + "epoch": 0.21940038507380583, + "learning_rate": 0.00015612175667002845, + "loss": 0.89, + "mean_token_accuracy": 0.728826767206192, + "num_tokens": 55360200.0, + "step": 23930 + }, + { + "epoch": 0.21949206931328505, + "learning_rate": 0.0001561034198221326, + "loss": 0.8282, + "mean_token_accuracy": 0.7571542203426361, + "num_tokens": 55383552.0, + "step": 23940 + }, + { + "epoch": 0.21958375355276427, + "learning_rate": 0.00015608508297423673, + "loss": 0.9024, + "mean_token_accuracy": 0.7327570796012879, + "num_tokens": 55406816.0, + "step": 23950 + }, + { + "epoch": 0.21967543779224352, + "learning_rate": 0.0001560667461263409, + "loss": 0.8751, + "mean_token_accuracy": 0.7369073569774628, + "num_tokens": 55429402.0, + "step": 23960 + }, + { + "epoch": 0.21976712203172274, + "learning_rate": 0.00015604840927844503, + "loss": 0.8308, + "mean_token_accuracy": 0.753199428319931, + "num_tokens": 55452121.0, + "step": 23970 + }, + { + "epoch": 0.21985880627120197, + "learning_rate": 0.0001560300724305492, + "loss": 0.8376, + "mean_token_accuracy": 0.750776594877243, + "num_tokens": 55476260.0, + "step": 23980 + }, + { + "epoch": 0.21995049051068122, + "learning_rate": 0.00015601173558265334, + "loss": 0.8573, + "mean_token_accuracy": 0.7445099115371704, + "num_tokens": 55499888.0, + "step": 23990 + }, + { + "epoch": 0.22004217475016044, + "learning_rate": 0.0001559933987347575, + "loss": 0.9013, + "mean_token_accuracy": 0.7359369695186615, + "num_tokens": 55522509.0, + "step": 24000 + }, + { + "epoch": 0.2201338589896397, + "learning_rate": 0.00015597506188686167, + "loss": 0.8315, + "mean_token_accuracy": 0.75285684466362, + "num_tokens": 55545077.0, + "step": 24010 + }, + { + "epoch": 0.22022554322911891, + "learning_rate": 0.0001559567250389658, + "loss": 0.8581, + "mean_token_accuracy": 0.7412333250045776, + "num_tokens": 55567446.0, + "step": 24020 + }, + { + "epoch": 0.22031722746859814, + "learning_rate": 0.00015593838819106997, + "loss": 0.8819, + "mean_token_accuracy": 0.7352995276451111, + "num_tokens": 55590440.0, + "step": 24030 + }, + { + "epoch": 0.2204089117080774, + "learning_rate": 0.0001559200513431741, + "loss": 0.8723, + "mean_token_accuracy": 0.7348103106021882, + "num_tokens": 55613620.0, + "step": 24040 + }, + { + "epoch": 0.2205005959475566, + "learning_rate": 0.00015590171449527827, + "loss": 0.8783, + "mean_token_accuracy": 0.7398612320423126, + "num_tokens": 55637043.0, + "step": 24050 + }, + { + "epoch": 0.22059228018703586, + "learning_rate": 0.0001558833776473824, + "loss": 0.8474, + "mean_token_accuracy": 0.745047253370285, + "num_tokens": 55659449.0, + "step": 24060 + }, + { + "epoch": 0.22068396442651508, + "learning_rate": 0.00015586504079948658, + "loss": 0.887, + "mean_token_accuracy": 0.7352611005306244, + "num_tokens": 55682019.0, + "step": 24070 + }, + { + "epoch": 0.2207756486659943, + "learning_rate": 0.00015584670395159074, + "loss": 0.8948, + "mean_token_accuracy": 0.7356932163238525, + "num_tokens": 55705342.0, + "step": 24080 + }, + { + "epoch": 0.22086733290547356, + "learning_rate": 0.00015582836710369488, + "loss": 0.8175, + "mean_token_accuracy": 0.7523733794689178, + "num_tokens": 55729072.0, + "step": 24090 + }, + { + "epoch": 0.22095901714495278, + "learning_rate": 0.00015581003025579902, + "loss": 0.8956, + "mean_token_accuracy": 0.7405926644802093, + "num_tokens": 55752285.0, + "step": 24100 + }, + { + "epoch": 0.221050701384432, + "learning_rate": 0.00015579169340790319, + "loss": 0.8438, + "mean_token_accuracy": 0.7390296995639801, + "num_tokens": 55774982.0, + "step": 24110 + }, + { + "epoch": 0.22114238562391125, + "learning_rate": 0.00015577335656000732, + "loss": 0.8418, + "mean_token_accuracy": 0.744842278957367, + "num_tokens": 55797962.0, + "step": 24120 + }, + { + "epoch": 0.22123406986339048, + "learning_rate": 0.00015575501971211152, + "loss": 0.8558, + "mean_token_accuracy": 0.7467646896839142, + "num_tokens": 55820234.0, + "step": 24130 + }, + { + "epoch": 0.22132575410286973, + "learning_rate": 0.00015573668286421565, + "loss": 0.8315, + "mean_token_accuracy": 0.7507136106491089, + "num_tokens": 55843204.0, + "step": 24140 + }, + { + "epoch": 0.22141743834234895, + "learning_rate": 0.0001557183460163198, + "loss": 0.8848, + "mean_token_accuracy": 0.7322293877601623, + "num_tokens": 55866244.0, + "step": 24150 + }, + { + "epoch": 0.22150912258182817, + "learning_rate": 0.00015570000916842396, + "loss": 0.8653, + "mean_token_accuracy": 0.740640789270401, + "num_tokens": 55888300.0, + "step": 24160 + }, + { + "epoch": 0.22160080682130742, + "learning_rate": 0.0001556816723205281, + "loss": 0.8638, + "mean_token_accuracy": 0.7410377204418183, + "num_tokens": 55911949.0, + "step": 24170 + }, + { + "epoch": 0.22169249106078665, + "learning_rate": 0.00015566333547263226, + "loss": 0.8805, + "mean_token_accuracy": 0.7393958389759063, + "num_tokens": 55935051.0, + "step": 24180 + }, + { + "epoch": 0.2217841753002659, + "learning_rate": 0.0001556449986247364, + "loss": 0.8588, + "mean_token_accuracy": 0.7424891471862793, + "num_tokens": 55957905.0, + "step": 24190 + }, + { + "epoch": 0.22187585953974512, + "learning_rate": 0.00015562666177684057, + "loss": 0.8742, + "mean_token_accuracy": 0.7418850660324097, + "num_tokens": 55981382.0, + "step": 24200 + }, + { + "epoch": 0.22196754377922434, + "learning_rate": 0.00015560832492894473, + "loss": 0.8508, + "mean_token_accuracy": 0.7461317777633667, + "num_tokens": 56004358.0, + "step": 24210 + }, + { + "epoch": 0.2220592280187036, + "learning_rate": 0.00015558998808104887, + "loss": 0.8637, + "mean_token_accuracy": 0.7400383591651917, + "num_tokens": 56027254.0, + "step": 24220 + }, + { + "epoch": 0.22215091225818281, + "learning_rate": 0.00015557165123315303, + "loss": 0.8915, + "mean_token_accuracy": 0.7401159465312958, + "num_tokens": 56050493.0, + "step": 24230 + }, + { + "epoch": 0.22224259649766206, + "learning_rate": 0.00015555331438525717, + "loss": 0.8385, + "mean_token_accuracy": 0.7505717515945435, + "num_tokens": 56074138.0, + "step": 24240 + }, + { + "epoch": 0.2223342807371413, + "learning_rate": 0.00015553497753736134, + "loss": 0.864, + "mean_token_accuracy": 0.7438802659511566, + "num_tokens": 56097304.0, + "step": 24250 + }, + { + "epoch": 0.2224259649766205, + "learning_rate": 0.0001555166406894655, + "loss": 0.8582, + "mean_token_accuracy": 0.7439675509929657, + "num_tokens": 56120300.0, + "step": 24260 + }, + { + "epoch": 0.22251764921609976, + "learning_rate": 0.00015549830384156964, + "loss": 0.84, + "mean_token_accuracy": 0.7437430799007416, + "num_tokens": 56143176.0, + "step": 24270 + }, + { + "epoch": 0.22260933345557898, + "learning_rate": 0.0001554799669936738, + "loss": 0.8819, + "mean_token_accuracy": 0.7356357038021087, + "num_tokens": 56166239.0, + "step": 24280 + }, + { + "epoch": 0.2227010176950582, + "learning_rate": 0.00015546163014577795, + "loss": 0.8847, + "mean_token_accuracy": 0.741468071937561, + "num_tokens": 56189490.0, + "step": 24290 + }, + { + "epoch": 0.22279270193453746, + "learning_rate": 0.00015544329329788208, + "loss": 0.8789, + "mean_token_accuracy": 0.7427528321743011, + "num_tokens": 56213041.0, + "step": 24300 + }, + { + "epoch": 0.22288438617401668, + "learning_rate": 0.00015542495644998625, + "loss": 0.88, + "mean_token_accuracy": 0.7418298780918121, + "num_tokens": 56236414.0, + "step": 24310 + }, + { + "epoch": 0.22297607041349593, + "learning_rate": 0.0001554066196020904, + "loss": 0.8399, + "mean_token_accuracy": 0.7472315311431885, + "num_tokens": 56259296.0, + "step": 24320 + }, + { + "epoch": 0.22306775465297515, + "learning_rate": 0.00015538828275419458, + "loss": 0.8759, + "mean_token_accuracy": 0.7376609802246094, + "num_tokens": 56282709.0, + "step": 24330 + }, + { + "epoch": 0.22315943889245438, + "learning_rate": 0.00015536994590629872, + "loss": 0.8295, + "mean_token_accuracy": 0.7500767946243286, + "num_tokens": 56305399.0, + "step": 24340 + }, + { + "epoch": 0.22325112313193363, + "learning_rate": 0.00015535160905840286, + "loss": 0.8399, + "mean_token_accuracy": 0.7495501339435577, + "num_tokens": 56329027.0, + "step": 24350 + }, + { + "epoch": 0.22334280737141285, + "learning_rate": 0.00015533327221050702, + "loss": 0.8577, + "mean_token_accuracy": 0.747114610671997, + "num_tokens": 56352401.0, + "step": 24360 + }, + { + "epoch": 0.2234344916108921, + "learning_rate": 0.00015531493536261116, + "loss": 0.8055, + "mean_token_accuracy": 0.7586235523223877, + "num_tokens": 56375613.0, + "step": 24370 + }, + { + "epoch": 0.22352617585037132, + "learning_rate": 0.00015529659851471533, + "loss": 0.869, + "mean_token_accuracy": 0.7420877635478973, + "num_tokens": 56398680.0, + "step": 24380 + }, + { + "epoch": 0.22361786008985055, + "learning_rate": 0.0001552782616668195, + "loss": 0.8528, + "mean_token_accuracy": 0.7443232476711273, + "num_tokens": 56422318.0, + "step": 24390 + }, + { + "epoch": 0.2237095443293298, + "learning_rate": 0.00015525992481892363, + "loss": 0.8817, + "mean_token_accuracy": 0.74188734292984, + "num_tokens": 56445584.0, + "step": 24400 + }, + { + "epoch": 0.22380122856880902, + "learning_rate": 0.0001552415879710278, + "loss": 0.8649, + "mean_token_accuracy": 0.7461014330387116, + "num_tokens": 56469280.0, + "step": 24410 + }, + { + "epoch": 0.22389291280828824, + "learning_rate": 0.00015522325112313193, + "loss": 0.843, + "mean_token_accuracy": 0.7505100846290589, + "num_tokens": 56492747.0, + "step": 24420 + }, + { + "epoch": 0.2239845970477675, + "learning_rate": 0.0001552049142752361, + "loss": 0.8634, + "mean_token_accuracy": 0.7417403936386109, + "num_tokens": 56516060.0, + "step": 24430 + }, + { + "epoch": 0.22407628128724671, + "learning_rate": 0.00015518657742734024, + "loss": 0.8728, + "mean_token_accuracy": 0.7434927344322204, + "num_tokens": 56539230.0, + "step": 24440 + }, + { + "epoch": 0.22416796552672597, + "learning_rate": 0.0001551682405794444, + "loss": 0.8751, + "mean_token_accuracy": 0.7428310811519623, + "num_tokens": 56561651.0, + "step": 24450 + }, + { + "epoch": 0.2242596497662052, + "learning_rate": 0.00015514990373154857, + "loss": 0.8644, + "mean_token_accuracy": 0.7391244351863862, + "num_tokens": 56584795.0, + "step": 24460 + }, + { + "epoch": 0.2243513340056844, + "learning_rate": 0.0001551315668836527, + "loss": 0.8515, + "mean_token_accuracy": 0.7435534298419952, + "num_tokens": 56607654.0, + "step": 24470 + }, + { + "epoch": 0.22444301824516366, + "learning_rate": 0.00015511323003575687, + "loss": 0.8542, + "mean_token_accuracy": 0.743599671125412, + "num_tokens": 56631807.0, + "step": 24480 + }, + { + "epoch": 0.22453470248464288, + "learning_rate": 0.000155094893187861, + "loss": 0.8604, + "mean_token_accuracy": 0.7444347977638245, + "num_tokens": 56655863.0, + "step": 24490 + }, + { + "epoch": 0.22462638672412213, + "learning_rate": 0.00015507655633996515, + "loss": 0.8759, + "mean_token_accuracy": 0.7387280941009522, + "num_tokens": 56678861.0, + "step": 24500 + }, + { + "epoch": 0.22471807096360136, + "learning_rate": 0.00015505821949206931, + "loss": 0.8874, + "mean_token_accuracy": 0.7401228547096252, + "num_tokens": 56702575.0, + "step": 24510 + }, + { + "epoch": 0.22480975520308058, + "learning_rate": 0.00015503988264417348, + "loss": 0.8294, + "mean_token_accuracy": 0.7471656143665314, + "num_tokens": 56725452.0, + "step": 24520 + }, + { + "epoch": 0.22490143944255983, + "learning_rate": 0.00015502154579627764, + "loss": 0.8424, + "mean_token_accuracy": 0.7398037910461426, + "num_tokens": 56748631.0, + "step": 24530 + }, + { + "epoch": 0.22499312368203905, + "learning_rate": 0.00015500320894838178, + "loss": 0.8798, + "mean_token_accuracy": 0.7348233699798584, + "num_tokens": 56771624.0, + "step": 24540 + }, + { + "epoch": 0.2250848079215183, + "learning_rate": 0.00015498487210048592, + "loss": 0.8239, + "mean_token_accuracy": 0.7494547724723816, + "num_tokens": 56794665.0, + "step": 24550 + }, + { + "epoch": 0.22517649216099753, + "learning_rate": 0.0001549665352525901, + "loss": 0.8837, + "mean_token_accuracy": 0.7364970028400422, + "num_tokens": 56817625.0, + "step": 24560 + }, + { + "epoch": 0.22526817640047675, + "learning_rate": 0.00015494819840469423, + "loss": 0.8248, + "mean_token_accuracy": 0.7507057189941406, + "num_tokens": 56840334.0, + "step": 24570 + }, + { + "epoch": 0.225359860639956, + "learning_rate": 0.0001549298615567984, + "loss": 0.8114, + "mean_token_accuracy": 0.7491330444812775, + "num_tokens": 56863710.0, + "step": 24580 + }, + { + "epoch": 0.22545154487943522, + "learning_rate": 0.00015491152470890256, + "loss": 0.8821, + "mean_token_accuracy": 0.7415892958641053, + "num_tokens": 56886699.0, + "step": 24590 + }, + { + "epoch": 0.22554322911891445, + "learning_rate": 0.0001548931878610067, + "loss": 0.8379, + "mean_token_accuracy": 0.7512984931468963, + "num_tokens": 56909298.0, + "step": 24600 + }, + { + "epoch": 0.2256349133583937, + "learning_rate": 0.00015487485101311086, + "loss": 0.8739, + "mean_token_accuracy": 0.7323919415473938, + "num_tokens": 56933073.0, + "step": 24610 + }, + { + "epoch": 0.22572659759787292, + "learning_rate": 0.000154856514165215, + "loss": 0.85, + "mean_token_accuracy": 0.7439683377742767, + "num_tokens": 56956139.0, + "step": 24620 + }, + { + "epoch": 0.22581828183735217, + "learning_rate": 0.00015483817731731916, + "loss": 0.8689, + "mean_token_accuracy": 0.7440510332584381, + "num_tokens": 56979088.0, + "step": 24630 + }, + { + "epoch": 0.2259099660768314, + "learning_rate": 0.0001548198404694233, + "loss": 0.8657, + "mean_token_accuracy": 0.7423623442649842, + "num_tokens": 57002535.0, + "step": 24640 + }, + { + "epoch": 0.22600165031631061, + "learning_rate": 0.00015480150362152747, + "loss": 0.8944, + "mean_token_accuracy": 0.7390952825546264, + "num_tokens": 57025765.0, + "step": 24650 + }, + { + "epoch": 0.22609333455578987, + "learning_rate": 0.00015478316677363163, + "loss": 0.8493, + "mean_token_accuracy": 0.7484005272388459, + "num_tokens": 57048734.0, + "step": 24660 + }, + { + "epoch": 0.2261850187952691, + "learning_rate": 0.00015476482992573577, + "loss": 0.8722, + "mean_token_accuracy": 0.736942982673645, + "num_tokens": 57071929.0, + "step": 24670 + }, + { + "epoch": 0.22627670303474834, + "learning_rate": 0.00015474649307783994, + "loss": 0.8824, + "mean_token_accuracy": 0.7420193493366242, + "num_tokens": 57095542.0, + "step": 24680 + }, + { + "epoch": 0.22636838727422756, + "learning_rate": 0.00015472815622994407, + "loss": 0.8378, + "mean_token_accuracy": 0.7449758231639863, + "num_tokens": 57118565.0, + "step": 24690 + }, + { + "epoch": 0.22646007151370678, + "learning_rate": 0.00015470981938204824, + "loss": 0.8741, + "mean_token_accuracy": 0.7404014468193054, + "num_tokens": 57141420.0, + "step": 24700 + }, + { + "epoch": 0.22655175575318603, + "learning_rate": 0.00015469148253415238, + "loss": 0.8519, + "mean_token_accuracy": 0.7445592880249023, + "num_tokens": 57164619.0, + "step": 24710 + }, + { + "epoch": 0.22664343999266526, + "learning_rate": 0.00015467314568625654, + "loss": 0.862, + "mean_token_accuracy": 0.7371529340744019, + "num_tokens": 57188234.0, + "step": 24720 + }, + { + "epoch": 0.2267351242321445, + "learning_rate": 0.0001546548088383607, + "loss": 0.8964, + "mean_token_accuracy": 0.735043853521347, + "num_tokens": 57211321.0, + "step": 24730 + }, + { + "epoch": 0.22682680847162373, + "learning_rate": 0.00015463647199046485, + "loss": 0.8483, + "mean_token_accuracy": 0.7475723206996918, + "num_tokens": 57234545.0, + "step": 24740 + }, + { + "epoch": 0.22691849271110295, + "learning_rate": 0.00015461813514256899, + "loss": 0.8822, + "mean_token_accuracy": 0.7385982275009155, + "num_tokens": 57257569.0, + "step": 24750 + }, + { + "epoch": 0.2270101769505822, + "learning_rate": 0.00015459979829467315, + "loss": 0.8638, + "mean_token_accuracy": 0.742702966928482, + "num_tokens": 57279975.0, + "step": 24760 + }, + { + "epoch": 0.22710186119006143, + "learning_rate": 0.0001545814614467773, + "loss": 0.8544, + "mean_token_accuracy": 0.7445092737674713, + "num_tokens": 57303376.0, + "step": 24770 + }, + { + "epoch": 0.22719354542954065, + "learning_rate": 0.00015456312459888148, + "loss": 0.8751, + "mean_token_accuracy": 0.7360867619514465, + "num_tokens": 57326850.0, + "step": 24780 + }, + { + "epoch": 0.2272852296690199, + "learning_rate": 0.00015454478775098562, + "loss": 0.8735, + "mean_token_accuracy": 0.7465667426586151, + "num_tokens": 57350406.0, + "step": 24790 + }, + { + "epoch": 0.22737691390849912, + "learning_rate": 0.00015452645090308976, + "loss": 0.8577, + "mean_token_accuracy": 0.7381657600402832, + "num_tokens": 57373930.0, + "step": 24800 + }, + { + "epoch": 0.22746859814797837, + "learning_rate": 0.00015450811405519392, + "loss": 0.866, + "mean_token_accuracy": 0.7426710903644562, + "num_tokens": 57397601.0, + "step": 24810 + }, + { + "epoch": 0.2275602823874576, + "learning_rate": 0.00015448977720729806, + "loss": 0.8336, + "mean_token_accuracy": 0.7462375402450562, + "num_tokens": 57420395.0, + "step": 24820 + }, + { + "epoch": 0.22765196662693682, + "learning_rate": 0.00015447144035940223, + "loss": 0.827, + "mean_token_accuracy": 0.746272224187851, + "num_tokens": 57443718.0, + "step": 24830 + }, + { + "epoch": 0.22774365086641607, + "learning_rate": 0.00015445310351150637, + "loss": 0.8658, + "mean_token_accuracy": 0.7406410813331604, + "num_tokens": 57467203.0, + "step": 24840 + }, + { + "epoch": 0.2278353351058953, + "learning_rate": 0.00015443476666361053, + "loss": 0.8351, + "mean_token_accuracy": 0.748191624879837, + "num_tokens": 57490304.0, + "step": 24850 + }, + { + "epoch": 0.22792701934537454, + "learning_rate": 0.0001544164298157147, + "loss": 0.8645, + "mean_token_accuracy": 0.74213125705719, + "num_tokens": 57513518.0, + "step": 24860 + }, + { + "epoch": 0.22801870358485377, + "learning_rate": 0.00015439809296781884, + "loss": 0.8404, + "mean_token_accuracy": 0.7463255822658539, + "num_tokens": 57536445.0, + "step": 24870 + }, + { + "epoch": 0.228110387824333, + "learning_rate": 0.000154379756119923, + "loss": 0.9032, + "mean_token_accuracy": 0.7351026475429535, + "num_tokens": 57559747.0, + "step": 24880 + }, + { + "epoch": 0.22820207206381224, + "learning_rate": 0.00015436141927202714, + "loss": 0.8471, + "mean_token_accuracy": 0.748066633939743, + "num_tokens": 57581966.0, + "step": 24890 + }, + { + "epoch": 0.22829375630329146, + "learning_rate": 0.0001543430824241313, + "loss": 0.8504, + "mean_token_accuracy": 0.7467912256717681, + "num_tokens": 57604905.0, + "step": 24900 + }, + { + "epoch": 0.22838544054277068, + "learning_rate": 0.00015432474557623547, + "loss": 0.8875, + "mean_token_accuracy": 0.7365090548992157, + "num_tokens": 57628518.0, + "step": 24910 + }, + { + "epoch": 0.22847712478224994, + "learning_rate": 0.0001543064087283396, + "loss": 0.871, + "mean_token_accuracy": 0.7403376162052154, + "num_tokens": 57651665.0, + "step": 24920 + }, + { + "epoch": 0.22856880902172916, + "learning_rate": 0.00015428807188044377, + "loss": 0.8711, + "mean_token_accuracy": 0.7411530137062072, + "num_tokens": 57674991.0, + "step": 24930 + }, + { + "epoch": 0.2286604932612084, + "learning_rate": 0.0001542697350325479, + "loss": 0.843, + "mean_token_accuracy": 0.7386019885540008, + "num_tokens": 57698144.0, + "step": 24940 + }, + { + "epoch": 0.22875217750068763, + "learning_rate": 0.00015425139818465205, + "loss": 0.8329, + "mean_token_accuracy": 0.7490780770778656, + "num_tokens": 57721894.0, + "step": 24950 + }, + { + "epoch": 0.22884386174016685, + "learning_rate": 0.00015423306133675622, + "loss": 0.8425, + "mean_token_accuracy": 0.7458144187927246, + "num_tokens": 57744725.0, + "step": 24960 + }, + { + "epoch": 0.2289355459796461, + "learning_rate": 0.00015421472448886035, + "loss": 0.8907, + "mean_token_accuracy": 0.7429078042507171, + "num_tokens": 57768097.0, + "step": 24970 + }, + { + "epoch": 0.22902723021912533, + "learning_rate": 0.00015419638764096455, + "loss": 0.8581, + "mean_token_accuracy": 0.7372221231460572, + "num_tokens": 57790831.0, + "step": 24980 + }, + { + "epoch": 0.22911891445860458, + "learning_rate": 0.00015417805079306869, + "loss": 0.8831, + "mean_token_accuracy": 0.737917172908783, + "num_tokens": 57813922.0, + "step": 24990 + }, + { + "epoch": 0.2292105986980838, + "learning_rate": 0.00015415971394517282, + "loss": 0.8627, + "mean_token_accuracy": 0.7416988790035248, + "num_tokens": 57837143.0, + "step": 25000 + }, + { + "epoch": 0.22930228293756302, + "learning_rate": 0.000154141377097277, + "loss": 0.9013, + "mean_token_accuracy": 0.7348793506622314, + "num_tokens": 57859442.0, + "step": 25010 + }, + { + "epoch": 0.22939396717704227, + "learning_rate": 0.00015412304024938113, + "loss": 0.8776, + "mean_token_accuracy": 0.7403935253620147, + "num_tokens": 57882885.0, + "step": 25020 + }, + { + "epoch": 0.2294856514165215, + "learning_rate": 0.0001541047034014853, + "loss": 0.8858, + "mean_token_accuracy": 0.7390576839447022, + "num_tokens": 57905922.0, + "step": 25030 + }, + { + "epoch": 0.22957733565600075, + "learning_rate": 0.00015408636655358946, + "loss": 0.8351, + "mean_token_accuracy": 0.7414995014667511, + "num_tokens": 57928918.0, + "step": 25040 + }, + { + "epoch": 0.22966901989547997, + "learning_rate": 0.0001540680297056936, + "loss": 0.8782, + "mean_token_accuracy": 0.7407548666000366, + "num_tokens": 57951626.0, + "step": 25050 + }, + { + "epoch": 0.2297607041349592, + "learning_rate": 0.00015404969285779776, + "loss": 0.8767, + "mean_token_accuracy": 0.735957533121109, + "num_tokens": 57975618.0, + "step": 25060 + }, + { + "epoch": 0.22985238837443844, + "learning_rate": 0.0001540313560099019, + "loss": 0.8424, + "mean_token_accuracy": 0.7482416808605195, + "num_tokens": 57998609.0, + "step": 25070 + }, + { + "epoch": 0.22994407261391767, + "learning_rate": 0.00015401301916200607, + "loss": 0.8899, + "mean_token_accuracy": 0.735405319929123, + "num_tokens": 58021340.0, + "step": 25080 + }, + { + "epoch": 0.2300357568533969, + "learning_rate": 0.0001539946823141102, + "loss": 0.8619, + "mean_token_accuracy": 0.7451351046562195, + "num_tokens": 58044855.0, + "step": 25090 + }, + { + "epoch": 0.23012744109287614, + "learning_rate": 0.00015397634546621437, + "loss": 0.8689, + "mean_token_accuracy": 0.7421709656715393, + "num_tokens": 58067997.0, + "step": 25100 + }, + { + "epoch": 0.23021912533235536, + "learning_rate": 0.00015395800861831853, + "loss": 0.8743, + "mean_token_accuracy": 0.7373112738132477, + "num_tokens": 58091078.0, + "step": 25110 + }, + { + "epoch": 0.2303108095718346, + "learning_rate": 0.00015393967177042267, + "loss": 0.8873, + "mean_token_accuracy": 0.738627690076828, + "num_tokens": 58114277.0, + "step": 25120 + }, + { + "epoch": 0.23040249381131384, + "learning_rate": 0.00015392133492252684, + "loss": 0.8799, + "mean_token_accuracy": 0.7405313074588775, + "num_tokens": 58137929.0, + "step": 25130 + }, + { + "epoch": 0.23049417805079306, + "learning_rate": 0.00015390299807463098, + "loss": 0.9035, + "mean_token_accuracy": 0.7274326145648956, + "num_tokens": 58160912.0, + "step": 25140 + }, + { + "epoch": 0.2305858622902723, + "learning_rate": 0.00015388466122673511, + "loss": 0.843, + "mean_token_accuracy": 0.7468173027038574, + "num_tokens": 58183086.0, + "step": 25150 + }, + { + "epoch": 0.23067754652975153, + "learning_rate": 0.00015386632437883928, + "loss": 0.8665, + "mean_token_accuracy": 0.7416611790657044, + "num_tokens": 58206392.0, + "step": 25160 + }, + { + "epoch": 0.23076923076923078, + "learning_rate": 0.00015384798753094345, + "loss": 0.8508, + "mean_token_accuracy": 0.7480005204677582, + "num_tokens": 58229758.0, + "step": 25170 + }, + { + "epoch": 0.23086091500871, + "learning_rate": 0.0001538296506830476, + "loss": 0.8819, + "mean_token_accuracy": 0.7375615358352661, + "num_tokens": 58252065.0, + "step": 25180 + }, + { + "epoch": 0.23095259924818923, + "learning_rate": 0.00015381131383515175, + "loss": 0.8661, + "mean_token_accuracy": 0.7426708579063416, + "num_tokens": 58276073.0, + "step": 25190 + }, + { + "epoch": 0.23104428348766848, + "learning_rate": 0.0001537929769872559, + "loss": 0.9221, + "mean_token_accuracy": 0.7264938712120056, + "num_tokens": 58299222.0, + "step": 25200 + }, + { + "epoch": 0.2311359677271477, + "learning_rate": 0.00015377464013936005, + "loss": 0.8452, + "mean_token_accuracy": 0.7471257090568543, + "num_tokens": 58321658.0, + "step": 25210 + }, + { + "epoch": 0.23122765196662692, + "learning_rate": 0.0001537563032914642, + "loss": 0.8753, + "mean_token_accuracy": 0.7433595061302185, + "num_tokens": 58344246.0, + "step": 25220 + }, + { + "epoch": 0.23131933620610617, + "learning_rate": 0.00015373796644356836, + "loss": 0.8606, + "mean_token_accuracy": 0.7436851263046265, + "num_tokens": 58367350.0, + "step": 25230 + }, + { + "epoch": 0.2314110204455854, + "learning_rate": 0.00015371962959567252, + "loss": 0.8295, + "mean_token_accuracy": 0.7513671100139618, + "num_tokens": 58390349.0, + "step": 25240 + }, + { + "epoch": 0.23150270468506465, + "learning_rate": 0.00015370129274777666, + "loss": 0.8625, + "mean_token_accuracy": 0.7378962755203247, + "num_tokens": 58413732.0, + "step": 25250 + }, + { + "epoch": 0.23159438892454387, + "learning_rate": 0.00015368295589988083, + "loss": 0.8173, + "mean_token_accuracy": 0.7515727698802948, + "num_tokens": 58436637.0, + "step": 25260 + }, + { + "epoch": 0.2316860731640231, + "learning_rate": 0.00015366461905198496, + "loss": 0.8461, + "mean_token_accuracy": 0.7481701791286468, + "num_tokens": 58459711.0, + "step": 25270 + }, + { + "epoch": 0.23177775740350234, + "learning_rate": 0.00015364628220408913, + "loss": 0.8758, + "mean_token_accuracy": 0.7404216885566711, + "num_tokens": 58482154.0, + "step": 25280 + }, + { + "epoch": 0.23186944164298157, + "learning_rate": 0.00015362794535619327, + "loss": 0.8634, + "mean_token_accuracy": 0.7502171277999878, + "num_tokens": 58505395.0, + "step": 25290 + }, + { + "epoch": 0.23196112588246082, + "learning_rate": 0.00015360960850829743, + "loss": 0.8883, + "mean_token_accuracy": 0.7388078510761261, + "num_tokens": 58528371.0, + "step": 25300 + }, + { + "epoch": 0.23205281012194004, + "learning_rate": 0.0001535912716604016, + "loss": 0.8237, + "mean_token_accuracy": 0.747081845998764, + "num_tokens": 58551990.0, + "step": 25310 + }, + { + "epoch": 0.23214449436141926, + "learning_rate": 0.00015357293481250574, + "loss": 0.8552, + "mean_token_accuracy": 0.7440243124961853, + "num_tokens": 58574792.0, + "step": 25320 + }, + { + "epoch": 0.2322361786008985, + "learning_rate": 0.0001535545979646099, + "loss": 0.8504, + "mean_token_accuracy": 0.7496018052101135, + "num_tokens": 58596797.0, + "step": 25330 + }, + { + "epoch": 0.23232786284037774, + "learning_rate": 0.00015353626111671404, + "loss": 0.8148, + "mean_token_accuracy": 0.7489557206630707, + "num_tokens": 58619683.0, + "step": 25340 + }, + { + "epoch": 0.232419547079857, + "learning_rate": 0.00015351792426881818, + "loss": 0.8492, + "mean_token_accuracy": 0.7465729355812073, + "num_tokens": 58642595.0, + "step": 25350 + }, + { + "epoch": 0.2325112313193362, + "learning_rate": 0.00015349958742092234, + "loss": 0.8488, + "mean_token_accuracy": 0.7383763372898102, + "num_tokens": 58665394.0, + "step": 25360 + }, + { + "epoch": 0.23260291555881543, + "learning_rate": 0.0001534812505730265, + "loss": 0.8403, + "mean_token_accuracy": 0.7497602224349975, + "num_tokens": 58688035.0, + "step": 25370 + }, + { + "epoch": 0.23269459979829468, + "learning_rate": 0.00015346291372513068, + "loss": 0.8458, + "mean_token_accuracy": 0.7423629879951477, + "num_tokens": 58711086.0, + "step": 25380 + }, + { + "epoch": 0.2327862840377739, + "learning_rate": 0.00015344457687723481, + "loss": 0.847, + "mean_token_accuracy": 0.7445569574832916, + "num_tokens": 58733477.0, + "step": 25390 + }, + { + "epoch": 0.23287796827725313, + "learning_rate": 0.00015342624002933895, + "loss": 0.8638, + "mean_token_accuracy": 0.7452936112880707, + "num_tokens": 58757107.0, + "step": 25400 + }, + { + "epoch": 0.23296965251673238, + "learning_rate": 0.00015340790318144312, + "loss": 0.8601, + "mean_token_accuracy": 0.741677588224411, + "num_tokens": 58780288.0, + "step": 25410 + }, + { + "epoch": 0.2330613367562116, + "learning_rate": 0.00015338956633354726, + "loss": 0.8434, + "mean_token_accuracy": 0.7475954532623291, + "num_tokens": 58803007.0, + "step": 25420 + }, + { + "epoch": 0.23315302099569085, + "learning_rate": 0.00015337122948565142, + "loss": 0.84, + "mean_token_accuracy": 0.7521816074848175, + "num_tokens": 58825954.0, + "step": 25430 + }, + { + "epoch": 0.23324470523517007, + "learning_rate": 0.0001533528926377556, + "loss": 0.8641, + "mean_token_accuracy": 0.7487018287181855, + "num_tokens": 58848635.0, + "step": 25440 + }, + { + "epoch": 0.2333363894746493, + "learning_rate": 0.00015333455578985973, + "loss": 0.8517, + "mean_token_accuracy": 0.7424684166908264, + "num_tokens": 58872077.0, + "step": 25450 + }, + { + "epoch": 0.23342807371412855, + "learning_rate": 0.0001533162189419639, + "loss": 0.8704, + "mean_token_accuracy": 0.7372147023677826, + "num_tokens": 58894889.0, + "step": 25460 + }, + { + "epoch": 0.23351975795360777, + "learning_rate": 0.00015329788209406803, + "loss": 0.8654, + "mean_token_accuracy": 0.7474406838417054, + "num_tokens": 58918355.0, + "step": 25470 + }, + { + "epoch": 0.23361144219308702, + "learning_rate": 0.0001532795452461722, + "loss": 0.8816, + "mean_token_accuracy": 0.744608473777771, + "num_tokens": 58941341.0, + "step": 25480 + }, + { + "epoch": 0.23370312643256624, + "learning_rate": 0.00015326120839827633, + "loss": 0.9057, + "mean_token_accuracy": 0.7318639755249023, + "num_tokens": 58964375.0, + "step": 25490 + }, + { + "epoch": 0.23379481067204547, + "learning_rate": 0.0001532428715503805, + "loss": 0.8484, + "mean_token_accuracy": 0.7439403295516968, + "num_tokens": 58988214.0, + "step": 25500 + }, + { + "epoch": 0.23388649491152472, + "learning_rate": 0.00015322453470248466, + "loss": 0.8057, + "mean_token_accuracy": 0.7566617786884308, + "num_tokens": 59010918.0, + "step": 25510 + }, + { + "epoch": 0.23397817915100394, + "learning_rate": 0.0001532061978545888, + "loss": 0.835, + "mean_token_accuracy": 0.7533825874328614, + "num_tokens": 59034500.0, + "step": 25520 + }, + { + "epoch": 0.23406986339048316, + "learning_rate": 0.00015318786100669297, + "loss": 0.8614, + "mean_token_accuracy": 0.74126296043396, + "num_tokens": 59057221.0, + "step": 25530 + }, + { + "epoch": 0.2341615476299624, + "learning_rate": 0.0001531695241587971, + "loss": 0.8587, + "mean_token_accuracy": 0.7496389210224151, + "num_tokens": 59080168.0, + "step": 25540 + }, + { + "epoch": 0.23425323186944164, + "learning_rate": 0.00015315118731090124, + "loss": 0.854, + "mean_token_accuracy": 0.7466756463050842, + "num_tokens": 59103732.0, + "step": 25550 + }, + { + "epoch": 0.2343449161089209, + "learning_rate": 0.0001531328504630054, + "loss": 0.8872, + "mean_token_accuracy": 0.7361054718494415, + "num_tokens": 59127703.0, + "step": 25560 + }, + { + "epoch": 0.2344366003484001, + "learning_rate": 0.00015311451361510957, + "loss": 0.8779, + "mean_token_accuracy": 0.7358223915100097, + "num_tokens": 59150810.0, + "step": 25570 + }, + { + "epoch": 0.23452828458787933, + "learning_rate": 0.00015309617676721374, + "loss": 0.8278, + "mean_token_accuracy": 0.7478847682476044, + "num_tokens": 59173205.0, + "step": 25580 + }, + { + "epoch": 0.23461996882735858, + "learning_rate": 0.00015307783991931788, + "loss": 0.8674, + "mean_token_accuracy": 0.7413980424404144, + "num_tokens": 59196150.0, + "step": 25590 + }, + { + "epoch": 0.2347116530668378, + "learning_rate": 0.00015305950307142202, + "loss": 0.8171, + "mean_token_accuracy": 0.7523119330406189, + "num_tokens": 59218947.0, + "step": 25600 + }, + { + "epoch": 0.23480333730631706, + "learning_rate": 0.00015304116622352618, + "loss": 0.8652, + "mean_token_accuracy": 0.746193128824234, + "num_tokens": 59242644.0, + "step": 25610 + }, + { + "epoch": 0.23489502154579628, + "learning_rate": 0.00015302282937563032, + "loss": 0.7993, + "mean_token_accuracy": 0.7595108270645141, + "num_tokens": 59266159.0, + "step": 25620 + }, + { + "epoch": 0.2349867057852755, + "learning_rate": 0.0001530044925277345, + "loss": 0.8521, + "mean_token_accuracy": 0.7411499857902527, + "num_tokens": 59288880.0, + "step": 25630 + }, + { + "epoch": 0.23507839002475475, + "learning_rate": 0.00015298615567983865, + "loss": 0.8639, + "mean_token_accuracy": 0.7382328033447265, + "num_tokens": 59311283.0, + "step": 25640 + }, + { + "epoch": 0.23517007426423397, + "learning_rate": 0.0001529678188319428, + "loss": 0.8174, + "mean_token_accuracy": 0.7555031061172486, + "num_tokens": 59335183.0, + "step": 25650 + }, + { + "epoch": 0.23526175850371323, + "learning_rate": 0.00015294948198404696, + "loss": 0.8882, + "mean_token_accuracy": 0.7349155366420745, + "num_tokens": 59357863.0, + "step": 25660 + }, + { + "epoch": 0.23535344274319245, + "learning_rate": 0.0001529311451361511, + "loss": 0.8725, + "mean_token_accuracy": 0.7460060000419617, + "num_tokens": 59381002.0, + "step": 25670 + }, + { + "epoch": 0.23544512698267167, + "learning_rate": 0.00015291280828825526, + "loss": 0.8683, + "mean_token_accuracy": 0.7456463515758515, + "num_tokens": 59404668.0, + "step": 25680 + }, + { + "epoch": 0.23553681122215092, + "learning_rate": 0.0001528944714403594, + "loss": 0.8966, + "mean_token_accuracy": 0.7353382349014282, + "num_tokens": 59427709.0, + "step": 25690 + }, + { + "epoch": 0.23562849546163014, + "learning_rate": 0.00015287613459246356, + "loss": 0.8186, + "mean_token_accuracy": 0.754264110326767, + "num_tokens": 59450281.0, + "step": 25700 + }, + { + "epoch": 0.23572017970110937, + "learning_rate": 0.00015285779774456773, + "loss": 0.8902, + "mean_token_accuracy": 0.7390115857124329, + "num_tokens": 59473837.0, + "step": 25710 + }, + { + "epoch": 0.23581186394058862, + "learning_rate": 0.00015283946089667187, + "loss": 0.899, + "mean_token_accuracy": 0.7373830497264862, + "num_tokens": 59497061.0, + "step": 25720 + }, + { + "epoch": 0.23590354818006784, + "learning_rate": 0.00015282112404877603, + "loss": 0.8389, + "mean_token_accuracy": 0.7503412425518036, + "num_tokens": 59519429.0, + "step": 25730 + }, + { + "epoch": 0.2359952324195471, + "learning_rate": 0.00015280278720088017, + "loss": 0.8614, + "mean_token_accuracy": 0.7404552578926087, + "num_tokens": 59542369.0, + "step": 25740 + }, + { + "epoch": 0.2360869166590263, + "learning_rate": 0.0001527844503529843, + "loss": 0.8885, + "mean_token_accuracy": 0.7375787854194641, + "num_tokens": 59566727.0, + "step": 25750 + }, + { + "epoch": 0.23617860089850554, + "learning_rate": 0.0001527661135050885, + "loss": 0.8165, + "mean_token_accuracy": 0.7525578200817108, + "num_tokens": 59589340.0, + "step": 25760 + }, + { + "epoch": 0.2362702851379848, + "learning_rate": 0.00015274777665719264, + "loss": 0.8746, + "mean_token_accuracy": 0.7354776978492736, + "num_tokens": 59612169.0, + "step": 25770 + }, + { + "epoch": 0.236361969377464, + "learning_rate": 0.0001527294398092968, + "loss": 0.8589, + "mean_token_accuracy": 0.7442165195941925, + "num_tokens": 59634687.0, + "step": 25780 + }, + { + "epoch": 0.23645365361694326, + "learning_rate": 0.00015271110296140094, + "loss": 0.8416, + "mean_token_accuracy": 0.7429732918739319, + "num_tokens": 59657665.0, + "step": 25790 + }, + { + "epoch": 0.23654533785642248, + "learning_rate": 0.00015269276611350508, + "loss": 0.8892, + "mean_token_accuracy": 0.7356120705604553, + "num_tokens": 59680038.0, + "step": 25800 + }, + { + "epoch": 0.2366370220959017, + "learning_rate": 0.00015267442926560925, + "loss": 0.8803, + "mean_token_accuracy": 0.7332807183265686, + "num_tokens": 59703503.0, + "step": 25810 + }, + { + "epoch": 0.23672870633538096, + "learning_rate": 0.00015265609241771338, + "loss": 0.843, + "mean_token_accuracy": 0.7459983766078949, + "num_tokens": 59726455.0, + "step": 25820 + }, + { + "epoch": 0.23682039057486018, + "learning_rate": 0.00015263775556981758, + "loss": 0.8394, + "mean_token_accuracy": 0.7493344068527221, + "num_tokens": 59749853.0, + "step": 25830 + }, + { + "epoch": 0.2369120748143394, + "learning_rate": 0.00015261941872192172, + "loss": 0.8375, + "mean_token_accuracy": 0.7432567596435546, + "num_tokens": 59772394.0, + "step": 25840 + }, + { + "epoch": 0.23700375905381865, + "learning_rate": 0.00015260108187402585, + "loss": 0.8616, + "mean_token_accuracy": 0.7459872603416443, + "num_tokens": 59795906.0, + "step": 25850 + }, + { + "epoch": 0.23709544329329788, + "learning_rate": 0.00015258274502613002, + "loss": 0.8648, + "mean_token_accuracy": 0.740733414888382, + "num_tokens": 59818436.0, + "step": 25860 + }, + { + "epoch": 0.23718712753277713, + "learning_rate": 0.00015256440817823416, + "loss": 0.8277, + "mean_token_accuracy": 0.7478637576103211, + "num_tokens": 59842154.0, + "step": 25870 + }, + { + "epoch": 0.23727881177225635, + "learning_rate": 0.00015254607133033832, + "loss": 0.9151, + "mean_token_accuracy": 0.7274119138717652, + "num_tokens": 59864635.0, + "step": 25880 + }, + { + "epoch": 0.23737049601173557, + "learning_rate": 0.0001525277344824425, + "loss": 0.8764, + "mean_token_accuracy": 0.7428054809570312, + "num_tokens": 59888780.0, + "step": 25890 + }, + { + "epoch": 0.23746218025121482, + "learning_rate": 0.00015250939763454663, + "loss": 0.8731, + "mean_token_accuracy": 0.7317515194416047, + "num_tokens": 59912268.0, + "step": 25900 + }, + { + "epoch": 0.23755386449069404, + "learning_rate": 0.0001524910607866508, + "loss": 0.8546, + "mean_token_accuracy": 0.7477369487285614, + "num_tokens": 59935411.0, + "step": 25910 + }, + { + "epoch": 0.2376455487301733, + "learning_rate": 0.00015247272393875493, + "loss": 0.853, + "mean_token_accuracy": 0.7396930694580078, + "num_tokens": 59958666.0, + "step": 25920 + }, + { + "epoch": 0.23773723296965252, + "learning_rate": 0.0001524543870908591, + "loss": 0.8279, + "mean_token_accuracy": 0.7489610254764557, + "num_tokens": 59981887.0, + "step": 25930 + }, + { + "epoch": 0.23782891720913174, + "learning_rate": 0.00015243605024296323, + "loss": 0.8792, + "mean_token_accuracy": 0.7404627442359925, + "num_tokens": 60006042.0, + "step": 25940 + }, + { + "epoch": 0.237920601448611, + "learning_rate": 0.00015241771339506737, + "loss": 0.8711, + "mean_token_accuracy": 0.7439409255981445, + "num_tokens": 60030124.0, + "step": 25950 + }, + { + "epoch": 0.2380122856880902, + "learning_rate": 0.00015239937654717157, + "loss": 0.8598, + "mean_token_accuracy": 0.7414111018180847, + "num_tokens": 60053152.0, + "step": 25960 + }, + { + "epoch": 0.23810396992756946, + "learning_rate": 0.0001523810396992757, + "loss": 0.8807, + "mean_token_accuracy": 0.7420764863491058, + "num_tokens": 60076507.0, + "step": 25970 + }, + { + "epoch": 0.2381956541670487, + "learning_rate": 0.00015236270285137987, + "loss": 0.8557, + "mean_token_accuracy": 0.7429322481155396, + "num_tokens": 60100421.0, + "step": 25980 + }, + { + "epoch": 0.2382873384065279, + "learning_rate": 0.000152344366003484, + "loss": 0.8628, + "mean_token_accuracy": 0.7405757248401642, + "num_tokens": 60122979.0, + "step": 25990 + }, + { + "epoch": 0.23837902264600716, + "learning_rate": 0.00015232602915558815, + "loss": 0.8441, + "mean_token_accuracy": 0.7469919562339783, + "num_tokens": 60145681.0, + "step": 26000 + }, + { + "epoch": 0.23847070688548638, + "learning_rate": 0.0001523076923076923, + "loss": 0.8747, + "mean_token_accuracy": 0.7382449448108673, + "num_tokens": 60168676.0, + "step": 26010 + }, + { + "epoch": 0.2385623911249656, + "learning_rate": 0.00015228935545979648, + "loss": 0.873, + "mean_token_accuracy": 0.7435623288154602, + "num_tokens": 60192045.0, + "step": 26020 + }, + { + "epoch": 0.23865407536444486, + "learning_rate": 0.00015227101861190064, + "loss": 0.8608, + "mean_token_accuracy": 0.7379026055335999, + "num_tokens": 60214867.0, + "step": 26030 + }, + { + "epoch": 0.23874575960392408, + "learning_rate": 0.00015225268176400478, + "loss": 0.8149, + "mean_token_accuracy": 0.7526860177516937, + "num_tokens": 60238420.0, + "step": 26040 + }, + { + "epoch": 0.23883744384340333, + "learning_rate": 0.00015223434491610892, + "loss": 0.8896, + "mean_token_accuracy": 0.7381485342979431, + "num_tokens": 60261502.0, + "step": 26050 + }, + { + "epoch": 0.23892912808288255, + "learning_rate": 0.00015221600806821308, + "loss": 0.8805, + "mean_token_accuracy": 0.7382685422897339, + "num_tokens": 60285200.0, + "step": 26060 + }, + { + "epoch": 0.23902081232236178, + "learning_rate": 0.00015219767122031722, + "loss": 0.8558, + "mean_token_accuracy": 0.7376444458961486, + "num_tokens": 60309846.0, + "step": 26070 + }, + { + "epoch": 0.23911249656184103, + "learning_rate": 0.0001521793343724214, + "loss": 0.8757, + "mean_token_accuracy": 0.7434535145759582, + "num_tokens": 60332933.0, + "step": 26080 + }, + { + "epoch": 0.23920418080132025, + "learning_rate": 0.00015216099752452555, + "loss": 0.9186, + "mean_token_accuracy": 0.7292102634906769, + "num_tokens": 60356626.0, + "step": 26090 + }, + { + "epoch": 0.2392958650407995, + "learning_rate": 0.0001521426606766297, + "loss": 0.8738, + "mean_token_accuracy": 0.7410090923309326, + "num_tokens": 60380610.0, + "step": 26100 + }, + { + "epoch": 0.23938754928027872, + "learning_rate": 0.00015212432382873386, + "loss": 0.8837, + "mean_token_accuracy": 0.7353364884853363, + "num_tokens": 60402937.0, + "step": 26110 + }, + { + "epoch": 0.23947923351975794, + "learning_rate": 0.000152105986980838, + "loss": 0.8252, + "mean_token_accuracy": 0.7505240142345428, + "num_tokens": 60426106.0, + "step": 26120 + }, + { + "epoch": 0.2395709177592372, + "learning_rate": 0.00015208765013294216, + "loss": 0.8653, + "mean_token_accuracy": 0.7438559412956238, + "num_tokens": 60448246.0, + "step": 26130 + }, + { + "epoch": 0.23966260199871642, + "learning_rate": 0.0001520693132850463, + "loss": 0.8354, + "mean_token_accuracy": 0.7442316055297852, + "num_tokens": 60471616.0, + "step": 26140 + }, + { + "epoch": 0.23975428623819564, + "learning_rate": 0.00015205097643715046, + "loss": 0.8599, + "mean_token_accuracy": 0.7502242922782898, + "num_tokens": 60495373.0, + "step": 26150 + }, + { + "epoch": 0.2398459704776749, + "learning_rate": 0.00015203263958925463, + "loss": 0.833, + "mean_token_accuracy": 0.7505661010742187, + "num_tokens": 60519805.0, + "step": 26160 + }, + { + "epoch": 0.23993765471715411, + "learning_rate": 0.00015201430274135877, + "loss": 0.8457, + "mean_token_accuracy": 0.750264585018158, + "num_tokens": 60543982.0, + "step": 26170 + }, + { + "epoch": 0.24002933895663336, + "learning_rate": 0.00015199596589346293, + "loss": 0.8764, + "mean_token_accuracy": 0.7347649276256562, + "num_tokens": 60567493.0, + "step": 26180 + }, + { + "epoch": 0.2401210231961126, + "learning_rate": 0.00015197762904556707, + "loss": 0.856, + "mean_token_accuracy": 0.7419838309288025, + "num_tokens": 60589884.0, + "step": 26190 + }, + { + "epoch": 0.2402127074355918, + "learning_rate": 0.0001519592921976712, + "loss": 0.8774, + "mean_token_accuracy": 0.7397713422775268, + "num_tokens": 60613225.0, + "step": 26200 + }, + { + "epoch": 0.24030439167507106, + "learning_rate": 0.00015194095534977538, + "loss": 0.8617, + "mean_token_accuracy": 0.743641597032547, + "num_tokens": 60637045.0, + "step": 26210 + }, + { + "epoch": 0.24039607591455028, + "learning_rate": 0.00015192261850187954, + "loss": 0.832, + "mean_token_accuracy": 0.754779440164566, + "num_tokens": 60660055.0, + "step": 26220 + }, + { + "epoch": 0.24048776015402953, + "learning_rate": 0.0001519042816539837, + "loss": 0.8741, + "mean_token_accuracy": 0.7382874011993408, + "num_tokens": 60683596.0, + "step": 26230 + }, + { + "epoch": 0.24057944439350876, + "learning_rate": 0.00015188594480608784, + "loss": 0.8374, + "mean_token_accuracy": 0.7444458305835724, + "num_tokens": 60706186.0, + "step": 26240 + }, + { + "epoch": 0.24067112863298798, + "learning_rate": 0.00015186760795819198, + "loss": 0.8438, + "mean_token_accuracy": 0.7413602232933044, + "num_tokens": 60729319.0, + "step": 26250 + }, + { + "epoch": 0.24076281287246723, + "learning_rate": 0.00015184927111029615, + "loss": 0.8076, + "mean_token_accuracy": 0.7561198234558105, + "num_tokens": 60752702.0, + "step": 26260 + }, + { + "epoch": 0.24085449711194645, + "learning_rate": 0.0001518309342624003, + "loss": 0.91, + "mean_token_accuracy": 0.7317551493644714, + "num_tokens": 60775931.0, + "step": 26270 + }, + { + "epoch": 0.2409461813514257, + "learning_rate": 0.00015181259741450445, + "loss": 0.8449, + "mean_token_accuracy": 0.7484565675258636, + "num_tokens": 60798616.0, + "step": 26280 + }, + { + "epoch": 0.24103786559090493, + "learning_rate": 0.00015179426056660862, + "loss": 0.8874, + "mean_token_accuracy": 0.7473255813121795, + "num_tokens": 60821762.0, + "step": 26290 + }, + { + "epoch": 0.24112954983038415, + "learning_rate": 0.00015177592371871276, + "loss": 0.8769, + "mean_token_accuracy": 0.7485851407051086, + "num_tokens": 60844276.0, + "step": 26300 + }, + { + "epoch": 0.2412212340698634, + "learning_rate": 0.00015175758687081692, + "loss": 0.873, + "mean_token_accuracy": 0.741224330663681, + "num_tokens": 60867688.0, + "step": 26310 + }, + { + "epoch": 0.24131291830934262, + "learning_rate": 0.00015173925002292106, + "loss": 0.8561, + "mean_token_accuracy": 0.7429096281528473, + "num_tokens": 60890773.0, + "step": 26320 + }, + { + "epoch": 0.24140460254882184, + "learning_rate": 0.00015172091317502522, + "loss": 0.8486, + "mean_token_accuracy": 0.7413500130176545, + "num_tokens": 60913280.0, + "step": 26330 + }, + { + "epoch": 0.2414962867883011, + "learning_rate": 0.00015170257632712936, + "loss": 0.8652, + "mean_token_accuracy": 0.7433875560760498, + "num_tokens": 60936647.0, + "step": 26340 + }, + { + "epoch": 0.24158797102778032, + "learning_rate": 0.00015168423947923353, + "loss": 0.8056, + "mean_token_accuracy": 0.7550627827644348, + "num_tokens": 60959907.0, + "step": 26350 + }, + { + "epoch": 0.24167965526725957, + "learning_rate": 0.0001516659026313377, + "loss": 0.8746, + "mean_token_accuracy": 0.7450252413749695, + "num_tokens": 60982569.0, + "step": 26360 + }, + { + "epoch": 0.2417713395067388, + "learning_rate": 0.00015164756578344183, + "loss": 0.8338, + "mean_token_accuracy": 0.7551529586315155, + "num_tokens": 61005896.0, + "step": 26370 + }, + { + "epoch": 0.24186302374621801, + "learning_rate": 0.000151629228935546, + "loss": 0.8407, + "mean_token_accuracy": 0.7414148271083831, + "num_tokens": 61029129.0, + "step": 26380 + }, + { + "epoch": 0.24195470798569726, + "learning_rate": 0.00015161089208765014, + "loss": 0.8037, + "mean_token_accuracy": 0.7530421197414399, + "num_tokens": 61051764.0, + "step": 26390 + }, + { + "epoch": 0.2420463922251765, + "learning_rate": 0.00015159255523975427, + "loss": 0.8652, + "mean_token_accuracy": 0.7420929193496704, + "num_tokens": 61074638.0, + "step": 26400 + }, + { + "epoch": 0.24213807646465574, + "learning_rate": 0.00015157421839185844, + "loss": 0.853, + "mean_token_accuracy": 0.7520487010478973, + "num_tokens": 61098008.0, + "step": 26410 + }, + { + "epoch": 0.24222976070413496, + "learning_rate": 0.0001515558815439626, + "loss": 0.8774, + "mean_token_accuracy": 0.7372593939304352, + "num_tokens": 61120785.0, + "step": 26420 + }, + { + "epoch": 0.24232144494361418, + "learning_rate": 0.00015153754469606677, + "loss": 0.9286, + "mean_token_accuracy": 0.7267246842384338, + "num_tokens": 61143530.0, + "step": 26430 + }, + { + "epoch": 0.24241312918309343, + "learning_rate": 0.0001515192078481709, + "loss": 0.8977, + "mean_token_accuracy": 0.7310905039310456, + "num_tokens": 61166665.0, + "step": 26440 + }, + { + "epoch": 0.24250481342257266, + "learning_rate": 0.00015150087100027505, + "loss": 0.9056, + "mean_token_accuracy": 0.7390459179878235, + "num_tokens": 61190312.0, + "step": 26450 + }, + { + "epoch": 0.24259649766205188, + "learning_rate": 0.0001514825341523792, + "loss": 0.8584, + "mean_token_accuracy": 0.7411555409431457, + "num_tokens": 61212338.0, + "step": 26460 + }, + { + "epoch": 0.24268818190153113, + "learning_rate": 0.00015146419730448335, + "loss": 0.8427, + "mean_token_accuracy": 0.7455422639846802, + "num_tokens": 61235359.0, + "step": 26470 + }, + { + "epoch": 0.24277986614101035, + "learning_rate": 0.00015144586045658752, + "loss": 0.8569, + "mean_token_accuracy": 0.7438354790210724, + "num_tokens": 61258182.0, + "step": 26480 + }, + { + "epoch": 0.2428715503804896, + "learning_rate": 0.00015142752360869168, + "loss": 0.8839, + "mean_token_accuracy": 0.7364487528800965, + "num_tokens": 61280806.0, + "step": 26490 + }, + { + "epoch": 0.24296323461996883, + "learning_rate": 0.00015140918676079582, + "loss": 0.8501, + "mean_token_accuracy": 0.7426234364509583, + "num_tokens": 61304501.0, + "step": 26500 + }, + { + "epoch": 0.24305491885944805, + "learning_rate": 0.00015139084991289999, + "loss": 0.8674, + "mean_token_accuracy": 0.7410211980342865, + "num_tokens": 61327555.0, + "step": 26510 + }, + { + "epoch": 0.2431466030989273, + "learning_rate": 0.00015137251306500412, + "loss": 0.8595, + "mean_token_accuracy": 0.7516920983791351, + "num_tokens": 61351270.0, + "step": 26520 + }, + { + "epoch": 0.24323828733840652, + "learning_rate": 0.0001513541762171083, + "loss": 0.8623, + "mean_token_accuracy": 0.7415857791900635, + "num_tokens": 61374573.0, + "step": 26530 + }, + { + "epoch": 0.24332997157788577, + "learning_rate": 0.00015133583936921243, + "loss": 0.8741, + "mean_token_accuracy": 0.7398116827011109, + "num_tokens": 61398198.0, + "step": 26540 + }, + { + "epoch": 0.243421655817365, + "learning_rate": 0.0001513175025213166, + "loss": 0.8587, + "mean_token_accuracy": 0.7457467496395112, + "num_tokens": 61421330.0, + "step": 26550 + }, + { + "epoch": 0.24351334005684422, + "learning_rate": 0.00015129916567342076, + "loss": 0.8626, + "mean_token_accuracy": 0.7473425567150116, + "num_tokens": 61444872.0, + "step": 26560 + }, + { + "epoch": 0.24360502429632347, + "learning_rate": 0.0001512808288255249, + "loss": 0.8577, + "mean_token_accuracy": 0.7467374980449677, + "num_tokens": 61468539.0, + "step": 26570 + }, + { + "epoch": 0.2436967085358027, + "learning_rate": 0.00015126249197762906, + "loss": 0.8967, + "mean_token_accuracy": 0.7340288460254669, + "num_tokens": 61491513.0, + "step": 26580 + }, + { + "epoch": 0.24378839277528194, + "learning_rate": 0.0001512441551297332, + "loss": 0.8572, + "mean_token_accuracy": 0.7451032221317291, + "num_tokens": 61514131.0, + "step": 26590 + }, + { + "epoch": 0.24388007701476117, + "learning_rate": 0.00015122581828183734, + "loss": 0.8729, + "mean_token_accuracy": 0.7386572897434235, + "num_tokens": 61538498.0, + "step": 26600 + }, + { + "epoch": 0.2439717612542404, + "learning_rate": 0.00015120748143394153, + "loss": 0.8251, + "mean_token_accuracy": 0.7478527426719666, + "num_tokens": 61562105.0, + "step": 26610 + }, + { + "epoch": 0.24406344549371964, + "learning_rate": 0.00015118914458604567, + "loss": 0.8847, + "mean_token_accuracy": 0.737487506866455, + "num_tokens": 61585307.0, + "step": 26620 + }, + { + "epoch": 0.24415512973319886, + "learning_rate": 0.00015117080773814984, + "loss": 0.843, + "mean_token_accuracy": 0.7511949062347412, + "num_tokens": 61608507.0, + "step": 26630 + }, + { + "epoch": 0.24424681397267808, + "learning_rate": 0.00015115247089025397, + "loss": 0.8279, + "mean_token_accuracy": 0.7499415636062622, + "num_tokens": 61631639.0, + "step": 26640 + }, + { + "epoch": 0.24433849821215733, + "learning_rate": 0.0001511341340423581, + "loss": 0.829, + "mean_token_accuracy": 0.7521292626857757, + "num_tokens": 61654814.0, + "step": 26650 + }, + { + "epoch": 0.24443018245163656, + "learning_rate": 0.00015111579719446228, + "loss": 0.8268, + "mean_token_accuracy": 0.7496983349323273, + "num_tokens": 61678882.0, + "step": 26660 + }, + { + "epoch": 0.2445218666911158, + "learning_rate": 0.00015109746034656642, + "loss": 0.8555, + "mean_token_accuracy": 0.7474999368190766, + "num_tokens": 61702379.0, + "step": 26670 + }, + { + "epoch": 0.24461355093059503, + "learning_rate": 0.00015107912349867058, + "loss": 0.8533, + "mean_token_accuracy": 0.7445842027664185, + "num_tokens": 61726096.0, + "step": 26680 + }, + { + "epoch": 0.24470523517007425, + "learning_rate": 0.00015106078665077475, + "loss": 0.9065, + "mean_token_accuracy": 0.7378456234931946, + "num_tokens": 61748683.0, + "step": 26690 + }, + { + "epoch": 0.2447969194095535, + "learning_rate": 0.00015104244980287888, + "loss": 0.8711, + "mean_token_accuracy": 0.7429121255874633, + "num_tokens": 61772500.0, + "step": 26700 + }, + { + "epoch": 0.24488860364903273, + "learning_rate": 0.00015102411295498305, + "loss": 0.8876, + "mean_token_accuracy": 0.7383490979671479, + "num_tokens": 61796587.0, + "step": 26710 + }, + { + "epoch": 0.24498028788851198, + "learning_rate": 0.0001510057761070872, + "loss": 0.893, + "mean_token_accuracy": 0.7369406044483184, + "num_tokens": 61819163.0, + "step": 26720 + }, + { + "epoch": 0.2450719721279912, + "learning_rate": 0.00015098743925919135, + "loss": 0.8101, + "mean_token_accuracy": 0.7523659229278564, + "num_tokens": 61842815.0, + "step": 26730 + }, + { + "epoch": 0.24516365636747042, + "learning_rate": 0.00015096910241129552, + "loss": 0.8636, + "mean_token_accuracy": 0.7446376144886017, + "num_tokens": 61866346.0, + "step": 26740 + }, + { + "epoch": 0.24525534060694967, + "learning_rate": 0.00015095076556339966, + "loss": 0.881, + "mean_token_accuracy": 0.7377575397491455, + "num_tokens": 61890179.0, + "step": 26750 + }, + { + "epoch": 0.2453470248464289, + "learning_rate": 0.00015093242871550382, + "loss": 0.8813, + "mean_token_accuracy": 0.7363186776638031, + "num_tokens": 61913063.0, + "step": 26760 + }, + { + "epoch": 0.24543870908590812, + "learning_rate": 0.00015091409186760796, + "loss": 0.8611, + "mean_token_accuracy": 0.7483425676822663, + "num_tokens": 61935806.0, + "step": 26770 + }, + { + "epoch": 0.24553039332538737, + "learning_rate": 0.00015089575501971213, + "loss": 0.8642, + "mean_token_accuracy": 0.7431134819984436, + "num_tokens": 61959200.0, + "step": 26780 + }, + { + "epoch": 0.2456220775648666, + "learning_rate": 0.00015087741817181627, + "loss": 0.8142, + "mean_token_accuracy": 0.7511698305606842, + "num_tokens": 61982728.0, + "step": 26790 + }, + { + "epoch": 0.24571376180434584, + "learning_rate": 0.0001508590813239204, + "loss": 0.8368, + "mean_token_accuracy": 0.7514487862586975, + "num_tokens": 62006017.0, + "step": 26800 + }, + { + "epoch": 0.24580544604382507, + "learning_rate": 0.0001508407444760246, + "loss": 0.8538, + "mean_token_accuracy": 0.7411257028579712, + "num_tokens": 62029398.0, + "step": 26810 + }, + { + "epoch": 0.2458971302833043, + "learning_rate": 0.00015082240762812873, + "loss": 0.8542, + "mean_token_accuracy": 0.745817244052887, + "num_tokens": 62052495.0, + "step": 26820 + }, + { + "epoch": 0.24598881452278354, + "learning_rate": 0.0001508040707802329, + "loss": 0.8226, + "mean_token_accuracy": 0.75605508685112, + "num_tokens": 62075613.0, + "step": 26830 + }, + { + "epoch": 0.24608049876226276, + "learning_rate": 0.00015078573393233704, + "loss": 0.8261, + "mean_token_accuracy": 0.7498820841312408, + "num_tokens": 62099819.0, + "step": 26840 + }, + { + "epoch": 0.246172183001742, + "learning_rate": 0.00015076739708444118, + "loss": 0.8277, + "mean_token_accuracy": 0.7518484711647033, + "num_tokens": 62121997.0, + "step": 26850 + }, + { + "epoch": 0.24626386724122123, + "learning_rate": 0.00015074906023654534, + "loss": 0.8767, + "mean_token_accuracy": 0.7354409396648407, + "num_tokens": 62145068.0, + "step": 26860 + }, + { + "epoch": 0.24635555148070046, + "learning_rate": 0.0001507307233886495, + "loss": 0.8836, + "mean_token_accuracy": 0.7420814752578735, + "num_tokens": 62168099.0, + "step": 26870 + }, + { + "epoch": 0.2464472357201797, + "learning_rate": 0.00015071238654075365, + "loss": 0.8605, + "mean_token_accuracy": 0.7410089373588562, + "num_tokens": 62191380.0, + "step": 26880 + }, + { + "epoch": 0.24653891995965893, + "learning_rate": 0.0001506940496928578, + "loss": 0.8738, + "mean_token_accuracy": 0.7459089696407318, + "num_tokens": 62214322.0, + "step": 26890 + }, + { + "epoch": 0.24663060419913818, + "learning_rate": 0.00015067571284496195, + "loss": 0.8597, + "mean_token_accuracy": 0.743206363916397, + "num_tokens": 62237955.0, + "step": 26900 + }, + { + "epoch": 0.2467222884386174, + "learning_rate": 0.00015065737599706611, + "loss": 0.895, + "mean_token_accuracy": 0.7290444374084473, + "num_tokens": 62260323.0, + "step": 26910 + }, + { + "epoch": 0.24681397267809663, + "learning_rate": 0.00015063903914917025, + "loss": 0.8891, + "mean_token_accuracy": 0.731582248210907, + "num_tokens": 62283170.0, + "step": 26920 + }, + { + "epoch": 0.24690565691757588, + "learning_rate": 0.00015062070230127442, + "loss": 0.8526, + "mean_token_accuracy": 0.7428878247737885, + "num_tokens": 62306287.0, + "step": 26930 + }, + { + "epoch": 0.2469973411570551, + "learning_rate": 0.00015060236545337858, + "loss": 0.875, + "mean_token_accuracy": 0.7361538946628571, + "num_tokens": 62329846.0, + "step": 26940 + }, + { + "epoch": 0.24708902539653432, + "learning_rate": 0.00015058402860548272, + "loss": 0.8416, + "mean_token_accuracy": 0.744611668586731, + "num_tokens": 62352767.0, + "step": 26950 + }, + { + "epoch": 0.24718070963601357, + "learning_rate": 0.0001505656917575869, + "loss": 0.8543, + "mean_token_accuracy": 0.7452895998954773, + "num_tokens": 62375546.0, + "step": 26960 + }, + { + "epoch": 0.2472723938754928, + "learning_rate": 0.00015054735490969103, + "loss": 0.9066, + "mean_token_accuracy": 0.7247574865818024, + "num_tokens": 62397916.0, + "step": 26970 + }, + { + "epoch": 0.24736407811497205, + "learning_rate": 0.0001505290180617952, + "loss": 0.8442, + "mean_token_accuracy": 0.7422787070274353, + "num_tokens": 62421526.0, + "step": 26980 + }, + { + "epoch": 0.24745576235445127, + "learning_rate": 0.00015051068121389933, + "loss": 0.8953, + "mean_token_accuracy": 0.736442220211029, + "num_tokens": 62444172.0, + "step": 26990 + }, + { + "epoch": 0.2475474465939305, + "learning_rate": 0.0001504923443660035, + "loss": 0.8931, + "mean_token_accuracy": 0.7396362960338593, + "num_tokens": 62466877.0, + "step": 27000 + }, + { + "epoch": 0.24763913083340974, + "learning_rate": 0.00015047400751810766, + "loss": 0.8734, + "mean_token_accuracy": 0.7421592712402344, + "num_tokens": 62489935.0, + "step": 27010 + }, + { + "epoch": 0.24773081507288897, + "learning_rate": 0.0001504556706702118, + "loss": 0.8624, + "mean_token_accuracy": 0.7441258907318116, + "num_tokens": 62513308.0, + "step": 27020 + }, + { + "epoch": 0.24782249931236822, + "learning_rate": 0.00015043733382231596, + "loss": 0.8577, + "mean_token_accuracy": 0.7449506878852844, + "num_tokens": 62537081.0, + "step": 27030 + }, + { + "epoch": 0.24791418355184744, + "learning_rate": 0.0001504189969744201, + "loss": 0.8491, + "mean_token_accuracy": 0.7461920797824859, + "num_tokens": 62560291.0, + "step": 27040 + }, + { + "epoch": 0.24800586779132666, + "learning_rate": 0.00015040066012652424, + "loss": 0.8852, + "mean_token_accuracy": 0.7368533611297607, + "num_tokens": 62582713.0, + "step": 27050 + }, + { + "epoch": 0.2480975520308059, + "learning_rate": 0.0001503823232786284, + "loss": 0.8317, + "mean_token_accuracy": 0.7470174729824066, + "num_tokens": 62604820.0, + "step": 27060 + }, + { + "epoch": 0.24818923627028514, + "learning_rate": 0.00015036398643073257, + "loss": 0.8722, + "mean_token_accuracy": 0.7433541059494019, + "num_tokens": 62628708.0, + "step": 27070 + }, + { + "epoch": 0.24828092050976436, + "learning_rate": 0.0001503456495828367, + "loss": 0.8394, + "mean_token_accuracy": 0.7433184921741486, + "num_tokens": 62651787.0, + "step": 27080 + }, + { + "epoch": 0.2483726047492436, + "learning_rate": 0.00015032731273494088, + "loss": 0.8791, + "mean_token_accuracy": 0.7418513059616089, + "num_tokens": 62674438.0, + "step": 27090 + }, + { + "epoch": 0.24846428898872283, + "learning_rate": 0.00015030897588704501, + "loss": 0.8435, + "mean_token_accuracy": 0.745457261800766, + "num_tokens": 62697937.0, + "step": 27100 + }, + { + "epoch": 0.24855597322820208, + "learning_rate": 0.00015029063903914918, + "loss": 0.8636, + "mean_token_accuracy": 0.7362743437290191, + "num_tokens": 62721792.0, + "step": 27110 + }, + { + "epoch": 0.2486476574676813, + "learning_rate": 0.00015027230219125332, + "loss": 0.8763, + "mean_token_accuracy": 0.7412759482860565, + "num_tokens": 62745298.0, + "step": 27120 + }, + { + "epoch": 0.24873934170716053, + "learning_rate": 0.00015025396534335748, + "loss": 0.8571, + "mean_token_accuracy": 0.7426306903362274, + "num_tokens": 62768695.0, + "step": 27130 + }, + { + "epoch": 0.24883102594663978, + "learning_rate": 0.00015023562849546165, + "loss": 0.8402, + "mean_token_accuracy": 0.7535669267177582, + "num_tokens": 62791289.0, + "step": 27140 + }, + { + "epoch": 0.248922710186119, + "learning_rate": 0.0001502172916475658, + "loss": 0.8595, + "mean_token_accuracy": 0.742111599445343, + "num_tokens": 62814872.0, + "step": 27150 + }, + { + "epoch": 0.24901439442559825, + "learning_rate": 0.00015019895479966995, + "loss": 0.8392, + "mean_token_accuracy": 0.7452911853790283, + "num_tokens": 62838316.0, + "step": 27160 + }, + { + "epoch": 0.24910607866507747, + "learning_rate": 0.0001501806179517741, + "loss": 0.8594, + "mean_token_accuracy": 0.7459239482879638, + "num_tokens": 62861706.0, + "step": 27170 + }, + { + "epoch": 0.2491977629045567, + "learning_rate": 0.00015016228110387826, + "loss": 0.9038, + "mean_token_accuracy": 0.7337956607341767, + "num_tokens": 62884501.0, + "step": 27180 + }, + { + "epoch": 0.24928944714403595, + "learning_rate": 0.0001501439442559824, + "loss": 0.8656, + "mean_token_accuracy": 0.7398990273475647, + "num_tokens": 62908622.0, + "step": 27190 + }, + { + "epoch": 0.24938113138351517, + "learning_rate": 0.00015012560740808656, + "loss": 0.8806, + "mean_token_accuracy": 0.7421919882297516, + "num_tokens": 62931700.0, + "step": 27200 + }, + { + "epoch": 0.24947281562299442, + "learning_rate": 0.00015010727056019072, + "loss": 0.8561, + "mean_token_accuracy": 0.737982589006424, + "num_tokens": 62954404.0, + "step": 27210 + }, + { + "epoch": 0.24956449986247364, + "learning_rate": 0.00015008893371229486, + "loss": 0.8835, + "mean_token_accuracy": 0.7433018922805786, + "num_tokens": 62977991.0, + "step": 27220 + }, + { + "epoch": 0.24965618410195287, + "learning_rate": 0.00015007059686439903, + "loss": 0.7948, + "mean_token_accuracy": 0.7564925909042358, + "num_tokens": 63000780.0, + "step": 27230 + }, + { + "epoch": 0.24974786834143212, + "learning_rate": 0.00015005226001650317, + "loss": 0.8492, + "mean_token_accuracy": 0.7499097645282745, + "num_tokens": 63024223.0, + "step": 27240 + }, + { + "epoch": 0.24983955258091134, + "learning_rate": 0.0001500339231686073, + "loss": 0.8453, + "mean_token_accuracy": 0.7465799510478973, + "num_tokens": 63047655.0, + "step": 27250 + }, + { + "epoch": 0.24993123682039056, + "learning_rate": 0.0001500155863207115, + "loss": 0.8161, + "mean_token_accuracy": 0.7452511370182038, + "num_tokens": 63070714.0, + "step": 27260 + }, + { + "epoch": 0.2500229210598698, + "learning_rate": 0.00014999724947281564, + "loss": 0.817, + "mean_token_accuracy": 0.7468233466148376, + "num_tokens": 63093706.0, + "step": 27270 + }, + { + "epoch": 0.25011460529934904, + "learning_rate": 0.00014997891262491977, + "loss": 0.8397, + "mean_token_accuracy": 0.7532055139541626, + "num_tokens": 63116413.0, + "step": 27280 + }, + { + "epoch": 0.2502062895388283, + "learning_rate": 0.00014996057577702394, + "loss": 0.841, + "mean_token_accuracy": 0.7506026148796081, + "num_tokens": 63140020.0, + "step": 27290 + }, + { + "epoch": 0.25029797377830754, + "learning_rate": 0.00014994223892912808, + "loss": 0.9062, + "mean_token_accuracy": 0.732699579000473, + "num_tokens": 63163403.0, + "step": 27300 + }, + { + "epoch": 0.25038965801778673, + "learning_rate": 0.00014992390208123224, + "loss": 0.8586, + "mean_token_accuracy": 0.7432677268981933, + "num_tokens": 63186589.0, + "step": 27310 + }, + { + "epoch": 0.250481342257266, + "learning_rate": 0.00014990556523333638, + "loss": 0.8401, + "mean_token_accuracy": 0.7463052451610566, + "num_tokens": 63211032.0, + "step": 27320 + }, + { + "epoch": 0.25057302649674523, + "learning_rate": 0.00014988722838544055, + "loss": 0.8661, + "mean_token_accuracy": 0.7454921841621399, + "num_tokens": 63233942.0, + "step": 27330 + }, + { + "epoch": 0.2506647107362244, + "learning_rate": 0.0001498688915375447, + "loss": 0.853, + "mean_token_accuracy": 0.7432247877120972, + "num_tokens": 63256252.0, + "step": 27340 + }, + { + "epoch": 0.2507563949757037, + "learning_rate": 0.00014985055468964885, + "loss": 0.8242, + "mean_token_accuracy": 0.7477229058742523, + "num_tokens": 63280037.0, + "step": 27350 + }, + { + "epoch": 0.25084807921518293, + "learning_rate": 0.00014983221784175302, + "loss": 0.8703, + "mean_token_accuracy": 0.7464641690254211, + "num_tokens": 63302481.0, + "step": 27360 + }, + { + "epoch": 0.2509397634546621, + "learning_rate": 0.00014981388099385715, + "loss": 0.8309, + "mean_token_accuracy": 0.7471476495265961, + "num_tokens": 63325954.0, + "step": 27370 + }, + { + "epoch": 0.2510314476941414, + "learning_rate": 0.00014979554414596132, + "loss": 0.8698, + "mean_token_accuracy": 0.7405181527137756, + "num_tokens": 63348730.0, + "step": 27380 + }, + { + "epoch": 0.2511231319336206, + "learning_rate": 0.00014977720729806549, + "loss": 0.8874, + "mean_token_accuracy": 0.7401892364025116, + "num_tokens": 63370900.0, + "step": 27390 + }, + { + "epoch": 0.2512148161730998, + "learning_rate": 0.00014975887045016962, + "loss": 0.8456, + "mean_token_accuracy": 0.743671715259552, + "num_tokens": 63393906.0, + "step": 27400 + }, + { + "epoch": 0.25130650041257907, + "learning_rate": 0.0001497405336022738, + "loss": 0.8673, + "mean_token_accuracy": 0.7424066245555878, + "num_tokens": 63417663.0, + "step": 27410 + }, + { + "epoch": 0.2513981846520583, + "learning_rate": 0.00014972219675437793, + "loss": 0.8321, + "mean_token_accuracy": 0.7520144999027252, + "num_tokens": 63440724.0, + "step": 27420 + }, + { + "epoch": 0.25148986889153757, + "learning_rate": 0.0001497038599064821, + "loss": 0.859, + "mean_token_accuracy": 0.741386330127716, + "num_tokens": 63462970.0, + "step": 27430 + }, + { + "epoch": 0.25158155313101677, + "learning_rate": 0.00014968552305858623, + "loss": 0.8433, + "mean_token_accuracy": 0.7527381777763367, + "num_tokens": 63485825.0, + "step": 27440 + }, + { + "epoch": 0.251673237370496, + "learning_rate": 0.00014966718621069037, + "loss": 0.8802, + "mean_token_accuracy": 0.739150595664978, + "num_tokens": 63508316.0, + "step": 27450 + }, + { + "epoch": 0.25176492160997527, + "learning_rate": 0.00014964884936279456, + "loss": 0.8475, + "mean_token_accuracy": 0.7439385056495667, + "num_tokens": 63531956.0, + "step": 27460 + }, + { + "epoch": 0.25185660584945446, + "learning_rate": 0.0001496305125148987, + "loss": 0.8215, + "mean_token_accuracy": 0.7559373676776886, + "num_tokens": 63554944.0, + "step": 27470 + }, + { + "epoch": 0.2519482900889337, + "learning_rate": 0.00014961217566700284, + "loss": 0.8358, + "mean_token_accuracy": 0.7509729623794555, + "num_tokens": 63578468.0, + "step": 27480 + }, + { + "epoch": 0.25203997432841296, + "learning_rate": 0.000149593838819107, + "loss": 0.8713, + "mean_token_accuracy": 0.7407134234905243, + "num_tokens": 63601170.0, + "step": 27490 + }, + { + "epoch": 0.25213165856789216, + "learning_rate": 0.00014957550197121114, + "loss": 0.8394, + "mean_token_accuracy": 0.7518621146678924, + "num_tokens": 63625539.0, + "step": 27500 + }, + { + "epoch": 0.2522233428073714, + "learning_rate": 0.0001495571651233153, + "loss": 0.8454, + "mean_token_accuracy": 0.7450213611125946, + "num_tokens": 63649273.0, + "step": 27510 + }, + { + "epoch": 0.25231502704685066, + "learning_rate": 0.00014953882827541947, + "loss": 0.8671, + "mean_token_accuracy": 0.740081399679184, + "num_tokens": 63672100.0, + "step": 27520 + }, + { + "epoch": 0.25240671128632985, + "learning_rate": 0.0001495204914275236, + "loss": 0.8434, + "mean_token_accuracy": 0.7457730114459992, + "num_tokens": 63695148.0, + "step": 27530 + }, + { + "epoch": 0.2524983955258091, + "learning_rate": 0.00014950215457962778, + "loss": 0.8739, + "mean_token_accuracy": 0.739480984210968, + "num_tokens": 63718328.0, + "step": 27540 + }, + { + "epoch": 0.25259007976528836, + "learning_rate": 0.00014948381773173192, + "loss": 0.814, + "mean_token_accuracy": 0.7560616672039032, + "num_tokens": 63741194.0, + "step": 27550 + }, + { + "epoch": 0.2526817640047676, + "learning_rate": 0.00014946548088383608, + "loss": 0.8461, + "mean_token_accuracy": 0.7488047420978546, + "num_tokens": 63764382.0, + "step": 27560 + }, + { + "epoch": 0.2527734482442468, + "learning_rate": 0.00014944714403594022, + "loss": 0.8337, + "mean_token_accuracy": 0.7544873893260956, + "num_tokens": 63788497.0, + "step": 27570 + }, + { + "epoch": 0.25286513248372605, + "learning_rate": 0.00014942880718804438, + "loss": 0.8687, + "mean_token_accuracy": 0.7343391597270965, + "num_tokens": 63811426.0, + "step": 27580 + }, + { + "epoch": 0.2529568167232053, + "learning_rate": 0.00014941047034014855, + "loss": 0.8467, + "mean_token_accuracy": 0.7463156521320343, + "num_tokens": 63833993.0, + "step": 27590 + }, + { + "epoch": 0.2530485009626845, + "learning_rate": 0.0001493921334922527, + "loss": 0.8813, + "mean_token_accuracy": 0.7421612560749054, + "num_tokens": 63856580.0, + "step": 27600 + }, + { + "epoch": 0.25314018520216375, + "learning_rate": 0.00014937379664435685, + "loss": 0.855, + "mean_token_accuracy": 0.7461703479290008, + "num_tokens": 63879804.0, + "step": 27610 + }, + { + "epoch": 0.253231869441643, + "learning_rate": 0.000149355459796461, + "loss": 0.8453, + "mean_token_accuracy": 0.744089663028717, + "num_tokens": 63902235.0, + "step": 27620 + }, + { + "epoch": 0.2533235536811222, + "learning_rate": 0.00014933712294856516, + "loss": 0.8367, + "mean_token_accuracy": 0.7552065253257751, + "num_tokens": 63924451.0, + "step": 27630 + }, + { + "epoch": 0.25341523792060144, + "learning_rate": 0.0001493187861006693, + "loss": 0.8366, + "mean_token_accuracy": 0.7422115445137024, + "num_tokens": 63947429.0, + "step": 27640 + }, + { + "epoch": 0.2535069221600807, + "learning_rate": 0.00014930044925277343, + "loss": 0.8403, + "mean_token_accuracy": 0.7481965363025666, + "num_tokens": 63970539.0, + "step": 27650 + }, + { + "epoch": 0.2535986063995599, + "learning_rate": 0.00014928211240487763, + "loss": 0.8954, + "mean_token_accuracy": 0.7365795850753785, + "num_tokens": 63994385.0, + "step": 27660 + }, + { + "epoch": 0.25369029063903914, + "learning_rate": 0.00014926377555698176, + "loss": 0.8895, + "mean_token_accuracy": 0.736483770608902, + "num_tokens": 64017109.0, + "step": 27670 + }, + { + "epoch": 0.2537819748785184, + "learning_rate": 0.0001492454387090859, + "loss": 0.794, + "mean_token_accuracy": 0.7664094746112824, + "num_tokens": 64040056.0, + "step": 27680 + }, + { + "epoch": 0.25387365911799764, + "learning_rate": 0.00014922710186119007, + "loss": 0.8667, + "mean_token_accuracy": 0.7422010958194732, + "num_tokens": 64063168.0, + "step": 27690 + }, + { + "epoch": 0.25396534335747684, + "learning_rate": 0.0001492087650132942, + "loss": 0.8845, + "mean_token_accuracy": 0.73812175989151, + "num_tokens": 64086260.0, + "step": 27700 + }, + { + "epoch": 0.2540570275969561, + "learning_rate": 0.00014919042816539837, + "loss": 0.8224, + "mean_token_accuracy": 0.7560637831687927, + "num_tokens": 64110765.0, + "step": 27710 + }, + { + "epoch": 0.25414871183643534, + "learning_rate": 0.00014917209131750254, + "loss": 0.8671, + "mean_token_accuracy": 0.7410921573638916, + "num_tokens": 64133797.0, + "step": 27720 + }, + { + "epoch": 0.25424039607591453, + "learning_rate": 0.00014915375446960668, + "loss": 0.8652, + "mean_token_accuracy": 0.7404982089996338, + "num_tokens": 64156972.0, + "step": 27730 + }, + { + "epoch": 0.2543320803153938, + "learning_rate": 0.00014913541762171084, + "loss": 0.8336, + "mean_token_accuracy": 0.7471336543560028, + "num_tokens": 64180484.0, + "step": 27740 + }, + { + "epoch": 0.25442376455487303, + "learning_rate": 0.00014911708077381498, + "loss": 0.902, + "mean_token_accuracy": 0.7338102877140045, + "num_tokens": 64203458.0, + "step": 27750 + }, + { + "epoch": 0.25451544879435223, + "learning_rate": 0.00014909874392591915, + "loss": 0.8794, + "mean_token_accuracy": 0.742933839559555, + "num_tokens": 64226780.0, + "step": 27760 + }, + { + "epoch": 0.2546071330338315, + "learning_rate": 0.00014908040707802328, + "loss": 0.8968, + "mean_token_accuracy": 0.7303280770778656, + "num_tokens": 64250066.0, + "step": 27770 + }, + { + "epoch": 0.25469881727331073, + "learning_rate": 0.00014906207023012745, + "loss": 0.8363, + "mean_token_accuracy": 0.7506760716438293, + "num_tokens": 64272875.0, + "step": 27780 + }, + { + "epoch": 0.2547905015127899, + "learning_rate": 0.00014904373338223161, + "loss": 0.8555, + "mean_token_accuracy": 0.7442705988883972, + "num_tokens": 64296047.0, + "step": 27790 + }, + { + "epoch": 0.2548821857522692, + "learning_rate": 0.00014902539653433575, + "loss": 0.8578, + "mean_token_accuracy": 0.749461966753006, + "num_tokens": 64318818.0, + "step": 27800 + }, + { + "epoch": 0.2549738699917484, + "learning_rate": 0.00014900705968643992, + "loss": 0.8371, + "mean_token_accuracy": 0.7498965322971344, + "num_tokens": 64342462.0, + "step": 27810 + }, + { + "epoch": 0.2550655542312277, + "learning_rate": 0.00014898872283854406, + "loss": 0.8697, + "mean_token_accuracy": 0.7387650489807129, + "num_tokens": 64365382.0, + "step": 27820 + }, + { + "epoch": 0.25515723847070687, + "learning_rate": 0.00014897038599064822, + "loss": 0.8848, + "mean_token_accuracy": 0.7320538461208344, + "num_tokens": 64388493.0, + "step": 27830 + }, + { + "epoch": 0.2552489227101861, + "learning_rate": 0.00014895204914275236, + "loss": 0.8112, + "mean_token_accuracy": 0.7556831479072571, + "num_tokens": 64411274.0, + "step": 27840 + }, + { + "epoch": 0.25534060694966537, + "learning_rate": 0.00014893371229485653, + "loss": 0.8541, + "mean_token_accuracy": 0.7366828501224518, + "num_tokens": 64433665.0, + "step": 27850 + }, + { + "epoch": 0.25543229118914457, + "learning_rate": 0.0001489153754469607, + "loss": 0.8689, + "mean_token_accuracy": 0.7413061380386352, + "num_tokens": 64456799.0, + "step": 27860 + }, + { + "epoch": 0.2555239754286238, + "learning_rate": 0.00014889703859906483, + "loss": 0.8824, + "mean_token_accuracy": 0.7397329449653626, + "num_tokens": 64480108.0, + "step": 27870 + }, + { + "epoch": 0.25561565966810307, + "learning_rate": 0.00014887870175116897, + "loss": 0.847, + "mean_token_accuracy": 0.749979555606842, + "num_tokens": 64503395.0, + "step": 27880 + }, + { + "epoch": 0.25570734390758226, + "learning_rate": 0.00014886036490327313, + "loss": 0.8703, + "mean_token_accuracy": 0.7492643415927887, + "num_tokens": 64526547.0, + "step": 27890 + }, + { + "epoch": 0.2557990281470615, + "learning_rate": 0.00014884202805537727, + "loss": 0.843, + "mean_token_accuracy": 0.7489019095897674, + "num_tokens": 64549687.0, + "step": 27900 + }, + { + "epoch": 0.25589071238654076, + "learning_rate": 0.00014882369120748144, + "loss": 0.8737, + "mean_token_accuracy": 0.7379236459732056, + "num_tokens": 64572307.0, + "step": 27910 + }, + { + "epoch": 0.25598239662602, + "learning_rate": 0.0001488053543595856, + "loss": 0.855, + "mean_token_accuracy": 0.7451977670192719, + "num_tokens": 64595770.0, + "step": 27920 + }, + { + "epoch": 0.2560740808654992, + "learning_rate": 0.00014878701751168974, + "loss": 0.8543, + "mean_token_accuracy": 0.7364241421222687, + "num_tokens": 64618894.0, + "step": 27930 + }, + { + "epoch": 0.25616576510497846, + "learning_rate": 0.0001487686806637939, + "loss": 0.8322, + "mean_token_accuracy": 0.7494477868080139, + "num_tokens": 64641565.0, + "step": 27940 + }, + { + "epoch": 0.2562574493444577, + "learning_rate": 0.00014875034381589804, + "loss": 0.8448, + "mean_token_accuracy": 0.7500940978527069, + "num_tokens": 64665238.0, + "step": 27950 + }, + { + "epoch": 0.2563491335839369, + "learning_rate": 0.0001487320069680022, + "loss": 0.8758, + "mean_token_accuracy": 0.7441661059856415, + "num_tokens": 64688977.0, + "step": 27960 + }, + { + "epoch": 0.25644081782341616, + "learning_rate": 0.00014871367012010635, + "loss": 0.832, + "mean_token_accuracy": 0.7484582185745239, + "num_tokens": 64711971.0, + "step": 27970 + }, + { + "epoch": 0.2565325020628954, + "learning_rate": 0.0001486953332722105, + "loss": 0.8404, + "mean_token_accuracy": 0.7460843920707703, + "num_tokens": 64735269.0, + "step": 27980 + }, + { + "epoch": 0.2566241863023746, + "learning_rate": 0.00014867699642431468, + "loss": 0.9121, + "mean_token_accuracy": 0.7320519149303436, + "num_tokens": 64758426.0, + "step": 27990 + }, + { + "epoch": 0.25671587054185385, + "learning_rate": 0.00014865865957641882, + "loss": 0.8686, + "mean_token_accuracy": 0.7345442593097686, + "num_tokens": 64781597.0, + "step": 28000 + }, + { + "epoch": 0.2568075547813331, + "learning_rate": 0.00014864032272852298, + "loss": 0.8328, + "mean_token_accuracy": 0.7472794055938721, + "num_tokens": 64805020.0, + "step": 28010 + }, + { + "epoch": 0.2568992390208123, + "learning_rate": 0.00014862198588062712, + "loss": 0.8096, + "mean_token_accuracy": 0.7494252622127533, + "num_tokens": 64828278.0, + "step": 28020 + }, + { + "epoch": 0.25699092326029155, + "learning_rate": 0.00014860364903273129, + "loss": 0.869, + "mean_token_accuracy": 0.7407665729522706, + "num_tokens": 64850841.0, + "step": 28030 + }, + { + "epoch": 0.2570826074997708, + "learning_rate": 0.00014858531218483542, + "loss": 0.8318, + "mean_token_accuracy": 0.7525594234466553, + "num_tokens": 64873107.0, + "step": 28040 + }, + { + "epoch": 0.25717429173925005, + "learning_rate": 0.0001485669753369396, + "loss": 0.8449, + "mean_token_accuracy": 0.7486140429973602, + "num_tokens": 64896635.0, + "step": 28050 + }, + { + "epoch": 0.25726597597872924, + "learning_rate": 0.00014854863848904376, + "loss": 0.9136, + "mean_token_accuracy": 0.7302045464515686, + "num_tokens": 64920819.0, + "step": 28060 + }, + { + "epoch": 0.2573576602182085, + "learning_rate": 0.0001485303016411479, + "loss": 0.8725, + "mean_token_accuracy": 0.7373661279678345, + "num_tokens": 64943333.0, + "step": 28070 + }, + { + "epoch": 0.25744934445768775, + "learning_rate": 0.00014851196479325203, + "loss": 0.8991, + "mean_token_accuracy": 0.7330242574214936, + "num_tokens": 64966510.0, + "step": 28080 + }, + { + "epoch": 0.25754102869716694, + "learning_rate": 0.0001484936279453562, + "loss": 0.8844, + "mean_token_accuracy": 0.7403602242469788, + "num_tokens": 64989669.0, + "step": 28090 + }, + { + "epoch": 0.2576327129366462, + "learning_rate": 0.00014847529109746034, + "loss": 0.8483, + "mean_token_accuracy": 0.7522640228271484, + "num_tokens": 65012931.0, + "step": 28100 + }, + { + "epoch": 0.25772439717612544, + "learning_rate": 0.00014845695424956453, + "loss": 0.864, + "mean_token_accuracy": 0.7439845263957977, + "num_tokens": 65035544.0, + "step": 28110 + }, + { + "epoch": 0.25781608141560464, + "learning_rate": 0.00014843861740166867, + "loss": 0.868, + "mean_token_accuracy": 0.7458803355693817, + "num_tokens": 65058158.0, + "step": 28120 + }, + { + "epoch": 0.2579077656550839, + "learning_rate": 0.0001484202805537728, + "loss": 0.8467, + "mean_token_accuracy": 0.7457037091255188, + "num_tokens": 65081277.0, + "step": 28130 + }, + { + "epoch": 0.25799944989456314, + "learning_rate": 0.00014840194370587697, + "loss": 0.8278, + "mean_token_accuracy": 0.756156575679779, + "num_tokens": 65104023.0, + "step": 28140 + }, + { + "epoch": 0.25809113413404233, + "learning_rate": 0.0001483836068579811, + "loss": 0.7927, + "mean_token_accuracy": 0.7523608386516571, + "num_tokens": 65127045.0, + "step": 28150 + }, + { + "epoch": 0.2581828183735216, + "learning_rate": 0.00014836527001008527, + "loss": 0.8964, + "mean_token_accuracy": 0.7322318434715271, + "num_tokens": 65150294.0, + "step": 28160 + }, + { + "epoch": 0.25827450261300083, + "learning_rate": 0.0001483469331621894, + "loss": 0.8567, + "mean_token_accuracy": 0.7436087250709533, + "num_tokens": 65172773.0, + "step": 28170 + }, + { + "epoch": 0.2583661868524801, + "learning_rate": 0.00014832859631429358, + "loss": 0.848, + "mean_token_accuracy": 0.7448115289211273, + "num_tokens": 65196296.0, + "step": 28180 + }, + { + "epoch": 0.2584578710919593, + "learning_rate": 0.00014831025946639774, + "loss": 0.8195, + "mean_token_accuracy": 0.7525208175182343, + "num_tokens": 65219469.0, + "step": 28190 + }, + { + "epoch": 0.25854955533143853, + "learning_rate": 0.00014829192261850188, + "loss": 0.8904, + "mean_token_accuracy": 0.735933917760849, + "num_tokens": 65242975.0, + "step": 28200 + }, + { + "epoch": 0.2586412395709178, + "learning_rate": 0.00014827358577060605, + "loss": 0.9345, + "mean_token_accuracy": 0.7288546979427337, + "num_tokens": 65265797.0, + "step": 28210 + }, + { + "epoch": 0.258732923810397, + "learning_rate": 0.00014825524892271019, + "loss": 0.8826, + "mean_token_accuracy": 0.736388212442398, + "num_tokens": 65288984.0, + "step": 28220 + }, + { + "epoch": 0.2588246080498762, + "learning_rate": 0.00014823691207481435, + "loss": 0.8588, + "mean_token_accuracy": 0.7434767723083496, + "num_tokens": 65313165.0, + "step": 28230 + }, + { + "epoch": 0.2589162922893555, + "learning_rate": 0.00014821857522691852, + "loss": 0.8781, + "mean_token_accuracy": 0.7393793523311615, + "num_tokens": 65335543.0, + "step": 28240 + }, + { + "epoch": 0.25900797652883467, + "learning_rate": 0.00014820023837902265, + "loss": 0.8239, + "mean_token_accuracy": 0.7503474652767181, + "num_tokens": 65359806.0, + "step": 28250 + }, + { + "epoch": 0.2590996607683139, + "learning_rate": 0.00014818190153112682, + "loss": 0.8724, + "mean_token_accuracy": 0.7347579777240754, + "num_tokens": 65382585.0, + "step": 28260 + }, + { + "epoch": 0.2591913450077932, + "learning_rate": 0.00014816356468323096, + "loss": 0.8638, + "mean_token_accuracy": 0.7446154773235321, + "num_tokens": 65406208.0, + "step": 28270 + }, + { + "epoch": 0.25928302924727237, + "learning_rate": 0.0001481452278353351, + "loss": 0.8457, + "mean_token_accuracy": 0.7462586760520935, + "num_tokens": 65429819.0, + "step": 28280 + }, + { + "epoch": 0.2593747134867516, + "learning_rate": 0.00014812689098743926, + "loss": 0.8707, + "mean_token_accuracy": 0.7396560609340668, + "num_tokens": 65452921.0, + "step": 28290 + }, + { + "epoch": 0.25946639772623087, + "learning_rate": 0.0001481085541395434, + "loss": 0.8768, + "mean_token_accuracy": 0.7417271196842193, + "num_tokens": 65476641.0, + "step": 28300 + }, + { + "epoch": 0.2595580819657101, + "learning_rate": 0.0001480902172916476, + "loss": 0.8541, + "mean_token_accuracy": 0.7493411481380463, + "num_tokens": 65499848.0, + "step": 28310 + }, + { + "epoch": 0.2596497662051893, + "learning_rate": 0.00014807188044375173, + "loss": 0.8282, + "mean_token_accuracy": 0.7527835428714752, + "num_tokens": 65521786.0, + "step": 28320 + }, + { + "epoch": 0.25974145044466856, + "learning_rate": 0.00014805354359585587, + "loss": 0.8615, + "mean_token_accuracy": 0.7430724859237671, + "num_tokens": 65544046.0, + "step": 28330 + }, + { + "epoch": 0.2598331346841478, + "learning_rate": 0.00014803520674796003, + "loss": 0.8215, + "mean_token_accuracy": 0.7531533479690552, + "num_tokens": 65566841.0, + "step": 28340 + }, + { + "epoch": 0.259924818923627, + "learning_rate": 0.00014801686990006417, + "loss": 0.8468, + "mean_token_accuracy": 0.7496873915195466, + "num_tokens": 65589363.0, + "step": 28350 + }, + { + "epoch": 0.26001650316310626, + "learning_rate": 0.00014799853305216834, + "loss": 0.8627, + "mean_token_accuracy": 0.7484847903251648, + "num_tokens": 65612743.0, + "step": 28360 + }, + { + "epoch": 0.2601081874025855, + "learning_rate": 0.0001479801962042725, + "loss": 0.8304, + "mean_token_accuracy": 0.7515036821365356, + "num_tokens": 65635628.0, + "step": 28370 + }, + { + "epoch": 0.2601998716420647, + "learning_rate": 0.00014796185935637664, + "loss": 0.8287, + "mean_token_accuracy": 0.7580148875713348, + "num_tokens": 65659904.0, + "step": 28380 + }, + { + "epoch": 0.26029155588154396, + "learning_rate": 0.0001479435225084808, + "loss": 0.8814, + "mean_token_accuracy": 0.7388691902160645, + "num_tokens": 65682954.0, + "step": 28390 + }, + { + "epoch": 0.2603832401210232, + "learning_rate": 0.00014792518566058495, + "loss": 0.8345, + "mean_token_accuracy": 0.7522849917411805, + "num_tokens": 65706837.0, + "step": 28400 + }, + { + "epoch": 0.2604749243605024, + "learning_rate": 0.0001479068488126891, + "loss": 0.8412, + "mean_token_accuracy": 0.750131368637085, + "num_tokens": 65729766.0, + "step": 28410 + }, + { + "epoch": 0.26056660859998165, + "learning_rate": 0.00014788851196479325, + "loss": 0.8731, + "mean_token_accuracy": 0.7444917023181915, + "num_tokens": 65752106.0, + "step": 28420 + }, + { + "epoch": 0.2606582928394609, + "learning_rate": 0.00014787017511689742, + "loss": 0.8513, + "mean_token_accuracy": 0.7475113570690155, + "num_tokens": 65774994.0, + "step": 28430 + }, + { + "epoch": 0.26074997707894015, + "learning_rate": 0.00014785183826900158, + "loss": 0.8466, + "mean_token_accuracy": 0.7454447269439697, + "num_tokens": 65798226.0, + "step": 28440 + }, + { + "epoch": 0.26084166131841935, + "learning_rate": 0.00014783350142110572, + "loss": 0.8825, + "mean_token_accuracy": 0.7391950786113739, + "num_tokens": 65821982.0, + "step": 28450 + }, + { + "epoch": 0.2609333455578986, + "learning_rate": 0.00014781516457320988, + "loss": 0.8632, + "mean_token_accuracy": 0.7417172074317933, + "num_tokens": 65845979.0, + "step": 28460 + }, + { + "epoch": 0.26102502979737785, + "learning_rate": 0.00014779682772531402, + "loss": 0.8217, + "mean_token_accuracy": 0.7534918189048767, + "num_tokens": 65868720.0, + "step": 28470 + }, + { + "epoch": 0.26111671403685704, + "learning_rate": 0.00014777849087741816, + "loss": 0.8573, + "mean_token_accuracy": 0.740533709526062, + "num_tokens": 65893097.0, + "step": 28480 + }, + { + "epoch": 0.2612083982763363, + "learning_rate": 0.00014776015402952233, + "loss": 0.8681, + "mean_token_accuracy": 0.7428515791893006, + "num_tokens": 65916086.0, + "step": 28490 + }, + { + "epoch": 0.26130008251581555, + "learning_rate": 0.0001477418171816265, + "loss": 0.8632, + "mean_token_accuracy": 0.7424728989601135, + "num_tokens": 65938757.0, + "step": 28500 + }, + { + "epoch": 0.26139176675529474, + "learning_rate": 0.00014772348033373066, + "loss": 0.8589, + "mean_token_accuracy": 0.7380162298679351, + "num_tokens": 65962216.0, + "step": 28510 + }, + { + "epoch": 0.261483450994774, + "learning_rate": 0.0001477051434858348, + "loss": 0.8754, + "mean_token_accuracy": 0.7504049718379975, + "num_tokens": 65984995.0, + "step": 28520 + }, + { + "epoch": 0.26157513523425324, + "learning_rate": 0.00014768680663793893, + "loss": 0.8608, + "mean_token_accuracy": 0.7417503893375397, + "num_tokens": 66008025.0, + "step": 28530 + }, + { + "epoch": 0.2616668194737325, + "learning_rate": 0.0001476684697900431, + "loss": 0.8235, + "mean_token_accuracy": 0.7488840878009796, + "num_tokens": 66031154.0, + "step": 28540 + }, + { + "epoch": 0.2617585037132117, + "learning_rate": 0.00014765013294214724, + "loss": 0.8707, + "mean_token_accuracy": 0.7523537755012513, + "num_tokens": 66054178.0, + "step": 28550 + }, + { + "epoch": 0.26185018795269094, + "learning_rate": 0.0001476317960942514, + "loss": 0.8835, + "mean_token_accuracy": 0.7428346157073975, + "num_tokens": 66077158.0, + "step": 28560 + }, + { + "epoch": 0.2619418721921702, + "learning_rate": 0.00014761345924635557, + "loss": 0.8502, + "mean_token_accuracy": 0.7426634967327118, + "num_tokens": 66099979.0, + "step": 28570 + }, + { + "epoch": 0.2620335564316494, + "learning_rate": 0.0001475951223984597, + "loss": 0.8594, + "mean_token_accuracy": 0.745317006111145, + "num_tokens": 66122506.0, + "step": 28580 + }, + { + "epoch": 0.26212524067112863, + "learning_rate": 0.00014757678555056387, + "loss": 0.8215, + "mean_token_accuracy": 0.7506672024726868, + "num_tokens": 66145201.0, + "step": 28590 + }, + { + "epoch": 0.2622169249106079, + "learning_rate": 0.000147558448702668, + "loss": 0.8259, + "mean_token_accuracy": 0.750843733549118, + "num_tokens": 66168813.0, + "step": 28600 + }, + { + "epoch": 0.2623086091500871, + "learning_rate": 0.00014754011185477218, + "loss": 0.821, + "mean_token_accuracy": 0.7530823886394501, + "num_tokens": 66192111.0, + "step": 28610 + }, + { + "epoch": 0.26240029338956633, + "learning_rate": 0.00014752177500687631, + "loss": 0.8429, + "mean_token_accuracy": 0.7440512835979461, + "num_tokens": 66215335.0, + "step": 28620 + }, + { + "epoch": 0.2624919776290456, + "learning_rate": 0.00014750343815898048, + "loss": 0.8664, + "mean_token_accuracy": 0.739682936668396, + "num_tokens": 66238485.0, + "step": 28630 + }, + { + "epoch": 0.2625836618685248, + "learning_rate": 0.00014748510131108465, + "loss": 0.8329, + "mean_token_accuracy": 0.7496993005275726, + "num_tokens": 66261317.0, + "step": 28640 + }, + { + "epoch": 0.262675346108004, + "learning_rate": 0.00014746676446318878, + "loss": 0.8359, + "mean_token_accuracy": 0.7488134264945984, + "num_tokens": 66285067.0, + "step": 28650 + }, + { + "epoch": 0.2627670303474833, + "learning_rate": 0.00014744842761529295, + "loss": 0.8728, + "mean_token_accuracy": 0.7370449006557465, + "num_tokens": 66308060.0, + "step": 28660 + }, + { + "epoch": 0.2628587145869625, + "learning_rate": 0.0001474300907673971, + "loss": 0.893, + "mean_token_accuracy": 0.739249175786972, + "num_tokens": 66332005.0, + "step": 28670 + }, + { + "epoch": 0.2629503988264417, + "learning_rate": 0.00014741175391950123, + "loss": 0.873, + "mean_token_accuracy": 0.7420450985431671, + "num_tokens": 66355210.0, + "step": 28680 + }, + { + "epoch": 0.263042083065921, + "learning_rate": 0.0001473934170716054, + "loss": 0.8636, + "mean_token_accuracy": 0.744170343875885, + "num_tokens": 66378389.0, + "step": 28690 + }, + { + "epoch": 0.2631337673054002, + "learning_rate": 0.00014737508022370956, + "loss": 0.8733, + "mean_token_accuracy": 0.7426165461540222, + "num_tokens": 66401536.0, + "step": 28700 + }, + { + "epoch": 0.2632254515448794, + "learning_rate": 0.00014735674337581372, + "loss": 0.8634, + "mean_token_accuracy": 0.7362983167171478, + "num_tokens": 66424685.0, + "step": 28710 + }, + { + "epoch": 0.26331713578435867, + "learning_rate": 0.00014733840652791786, + "loss": 0.852, + "mean_token_accuracy": 0.74595428109169, + "num_tokens": 66447837.0, + "step": 28720 + }, + { + "epoch": 0.2634088200238379, + "learning_rate": 0.000147320069680022, + "loss": 0.8692, + "mean_token_accuracy": 0.7449594378471375, + "num_tokens": 66471085.0, + "step": 28730 + }, + { + "epoch": 0.2635005042633171, + "learning_rate": 0.00014730173283212616, + "loss": 0.8246, + "mean_token_accuracy": 0.7552474617958069, + "num_tokens": 66493931.0, + "step": 28740 + }, + { + "epoch": 0.26359218850279637, + "learning_rate": 0.0001472833959842303, + "loss": 0.852, + "mean_token_accuracy": 0.7436244904994964, + "num_tokens": 66516820.0, + "step": 28750 + }, + { + "epoch": 0.2636838727422756, + "learning_rate": 0.0001472650591363345, + "loss": 0.8601, + "mean_token_accuracy": 0.7436582863330841, + "num_tokens": 66540533.0, + "step": 28760 + }, + { + "epoch": 0.2637755569817548, + "learning_rate": 0.00014724672228843863, + "loss": 0.8521, + "mean_token_accuracy": 0.7424706399440766, + "num_tokens": 66563600.0, + "step": 28770 + }, + { + "epoch": 0.26386724122123406, + "learning_rate": 0.00014722838544054277, + "loss": 0.8647, + "mean_token_accuracy": 0.7430243372917176, + "num_tokens": 66586069.0, + "step": 28780 + }, + { + "epoch": 0.2639589254607133, + "learning_rate": 0.00014721004859264694, + "loss": 0.8666, + "mean_token_accuracy": 0.7367045223712921, + "num_tokens": 66609021.0, + "step": 28790 + }, + { + "epoch": 0.26405060970019256, + "learning_rate": 0.00014719171174475108, + "loss": 0.8668, + "mean_token_accuracy": 0.741569983959198, + "num_tokens": 66631758.0, + "step": 28800 + }, + { + "epoch": 0.26414229393967176, + "learning_rate": 0.00014717337489685524, + "loss": 0.8512, + "mean_token_accuracy": 0.7436561405658721, + "num_tokens": 66654784.0, + "step": 28810 + }, + { + "epoch": 0.264233978179151, + "learning_rate": 0.00014715503804895938, + "loss": 0.8296, + "mean_token_accuracy": 0.748553729057312, + "num_tokens": 66677839.0, + "step": 28820 + }, + { + "epoch": 0.26432566241863026, + "learning_rate": 0.00014713670120106354, + "loss": 0.8694, + "mean_token_accuracy": 0.7424539923667908, + "num_tokens": 66699875.0, + "step": 28830 + }, + { + "epoch": 0.26441734665810945, + "learning_rate": 0.0001471183643531677, + "loss": 0.8606, + "mean_token_accuracy": 0.7472703456878662, + "num_tokens": 66722994.0, + "step": 28840 + }, + { + "epoch": 0.2645090308975887, + "learning_rate": 0.00014710002750527185, + "loss": 0.8634, + "mean_token_accuracy": 0.7443240582942963, + "num_tokens": 66745235.0, + "step": 28850 + }, + { + "epoch": 0.26460071513706795, + "learning_rate": 0.000147081690657376, + "loss": 0.8552, + "mean_token_accuracy": 0.7454345524311066, + "num_tokens": 66768823.0, + "step": 28860 + }, + { + "epoch": 0.26469239937654715, + "learning_rate": 0.00014706335380948015, + "loss": 0.8453, + "mean_token_accuracy": 0.7457144618034363, + "num_tokens": 66791689.0, + "step": 28870 + }, + { + "epoch": 0.2647840836160264, + "learning_rate": 0.0001470450169615843, + "loss": 0.906, + "mean_token_accuracy": 0.7367794573307037, + "num_tokens": 66814321.0, + "step": 28880 + }, + { + "epoch": 0.26487576785550565, + "learning_rate": 0.00014702668011368846, + "loss": 0.8623, + "mean_token_accuracy": 0.7381490409374237, + "num_tokens": 66837741.0, + "step": 28890 + }, + { + "epoch": 0.26496745209498485, + "learning_rate": 0.00014700834326579262, + "loss": 0.8665, + "mean_token_accuracy": 0.7440053343772888, + "num_tokens": 66860678.0, + "step": 28900 + }, + { + "epoch": 0.2650591363344641, + "learning_rate": 0.00014699000641789679, + "loss": 0.8606, + "mean_token_accuracy": 0.7494698226451874, + "num_tokens": 66883296.0, + "step": 28910 + }, + { + "epoch": 0.26515082057394335, + "learning_rate": 0.00014697166957000092, + "loss": 0.8732, + "mean_token_accuracy": 0.7404204905033112, + "num_tokens": 66906013.0, + "step": 28920 + }, + { + "epoch": 0.2652425048134226, + "learning_rate": 0.00014695333272210506, + "loss": 0.8465, + "mean_token_accuracy": 0.7487307369709015, + "num_tokens": 66928597.0, + "step": 28930 + }, + { + "epoch": 0.2653341890529018, + "learning_rate": 0.00014693499587420923, + "loss": 0.8337, + "mean_token_accuracy": 0.7548036456108094, + "num_tokens": 66952014.0, + "step": 28940 + }, + { + "epoch": 0.26542587329238104, + "learning_rate": 0.00014691665902631337, + "loss": 0.8708, + "mean_token_accuracy": 0.7427916049957275, + "num_tokens": 66974983.0, + "step": 28950 + }, + { + "epoch": 0.2655175575318603, + "learning_rate": 0.00014689832217841756, + "loss": 0.8443, + "mean_token_accuracy": 0.7510434329509735, + "num_tokens": 66997248.0, + "step": 28960 + }, + { + "epoch": 0.2656092417713395, + "learning_rate": 0.0001468799853305217, + "loss": 0.837, + "mean_token_accuracy": 0.7415893733501434, + "num_tokens": 67019587.0, + "step": 28970 + }, + { + "epoch": 0.26570092601081874, + "learning_rate": 0.00014686164848262584, + "loss": 0.8838, + "mean_token_accuracy": 0.7404287934303284, + "num_tokens": 67042656.0, + "step": 28980 + }, + { + "epoch": 0.265792610250298, + "learning_rate": 0.00014684331163473, + "loss": 0.8627, + "mean_token_accuracy": 0.7427705228328705, + "num_tokens": 67064991.0, + "step": 28990 + }, + { + "epoch": 0.2658842944897772, + "learning_rate": 0.00014682497478683414, + "loss": 0.867, + "mean_token_accuracy": 0.7465137422084809, + "num_tokens": 67088364.0, + "step": 29000 + }, + { + "epoch": 0.26597597872925643, + "learning_rate": 0.0001468066379389383, + "loss": 0.8498, + "mean_token_accuracy": 0.7433292806148529, + "num_tokens": 67111344.0, + "step": 29010 + }, + { + "epoch": 0.2660676629687357, + "learning_rate": 0.00014678830109104244, + "loss": 0.8315, + "mean_token_accuracy": 0.7543451845645904, + "num_tokens": 67134783.0, + "step": 29020 + }, + { + "epoch": 0.2661593472082149, + "learning_rate": 0.0001467699642431466, + "loss": 0.8595, + "mean_token_accuracy": 0.7442370295524597, + "num_tokens": 67158060.0, + "step": 29030 + }, + { + "epoch": 0.26625103144769413, + "learning_rate": 0.00014675162739525077, + "loss": 0.8478, + "mean_token_accuracy": 0.7446286261081696, + "num_tokens": 67182099.0, + "step": 29040 + }, + { + "epoch": 0.2663427156871734, + "learning_rate": 0.0001467332905473549, + "loss": 0.8602, + "mean_token_accuracy": 0.7392730414867401, + "num_tokens": 67205297.0, + "step": 29050 + }, + { + "epoch": 0.26643439992665263, + "learning_rate": 0.00014671495369945908, + "loss": 0.8619, + "mean_token_accuracy": 0.7441462278366089, + "num_tokens": 67227530.0, + "step": 29060 + }, + { + "epoch": 0.2665260841661318, + "learning_rate": 0.00014669661685156322, + "loss": 0.8509, + "mean_token_accuracy": 0.752511179447174, + "num_tokens": 67250416.0, + "step": 29070 + }, + { + "epoch": 0.2666177684056111, + "learning_rate": 0.00014667828000366735, + "loss": 0.8649, + "mean_token_accuracy": 0.7423738956451416, + "num_tokens": 67273483.0, + "step": 29080 + }, + { + "epoch": 0.26670945264509033, + "learning_rate": 0.00014665994315577155, + "loss": 0.888, + "mean_token_accuracy": 0.7406603693962097, + "num_tokens": 67296409.0, + "step": 29090 + }, + { + "epoch": 0.2668011368845695, + "learning_rate": 0.00014664160630787569, + "loss": 0.861, + "mean_token_accuracy": 0.7430307030677795, + "num_tokens": 67320120.0, + "step": 29100 + }, + { + "epoch": 0.2668928211240488, + "learning_rate": 0.00014662326945997985, + "loss": 0.8729, + "mean_token_accuracy": 0.7388255298137665, + "num_tokens": 67342508.0, + "step": 29110 + }, + { + "epoch": 0.266984505363528, + "learning_rate": 0.000146604932612084, + "loss": 0.8512, + "mean_token_accuracy": 0.7403953552246094, + "num_tokens": 67366231.0, + "step": 29120 + }, + { + "epoch": 0.2670761896030072, + "learning_rate": 0.00014658659576418813, + "loss": 0.845, + "mean_token_accuracy": 0.7455290079116821, + "num_tokens": 67389728.0, + "step": 29130 + }, + { + "epoch": 0.26716787384248647, + "learning_rate": 0.0001465682589162923, + "loss": 0.8545, + "mean_token_accuracy": 0.7436563789844512, + "num_tokens": 67411895.0, + "step": 29140 + }, + { + "epoch": 0.2672595580819657, + "learning_rate": 0.00014654992206839643, + "loss": 0.858, + "mean_token_accuracy": 0.7372546017169952, + "num_tokens": 67435493.0, + "step": 29150 + }, + { + "epoch": 0.26735124232144497, + "learning_rate": 0.00014653158522050062, + "loss": 0.9159, + "mean_token_accuracy": 0.7308765232563019, + "num_tokens": 67458961.0, + "step": 29160 + }, + { + "epoch": 0.26744292656092417, + "learning_rate": 0.00014651324837260476, + "loss": 0.8537, + "mean_token_accuracy": 0.7504374504089355, + "num_tokens": 67481489.0, + "step": 29170 + }, + { + "epoch": 0.2675346108004034, + "learning_rate": 0.0001464949115247089, + "loss": 0.8749, + "mean_token_accuracy": 0.7418615996837616, + "num_tokens": 67504256.0, + "step": 29180 + }, + { + "epoch": 0.26762629503988267, + "learning_rate": 0.00014647657467681307, + "loss": 0.8883, + "mean_token_accuracy": 0.7359951794147491, + "num_tokens": 67527126.0, + "step": 29190 + }, + { + "epoch": 0.26771797927936186, + "learning_rate": 0.0001464582378289172, + "loss": 0.8367, + "mean_token_accuracy": 0.746992540359497, + "num_tokens": 67550006.0, + "step": 29200 + }, + { + "epoch": 0.2678096635188411, + "learning_rate": 0.00014643990098102137, + "loss": 0.8372, + "mean_token_accuracy": 0.742882889509201, + "num_tokens": 67573479.0, + "step": 29210 + }, + { + "epoch": 0.26790134775832036, + "learning_rate": 0.00014642156413312553, + "loss": 0.8936, + "mean_token_accuracy": 0.7388453662395478, + "num_tokens": 67596265.0, + "step": 29220 + }, + { + "epoch": 0.26799303199779956, + "learning_rate": 0.00014640322728522967, + "loss": 0.8482, + "mean_token_accuracy": 0.750929081439972, + "num_tokens": 67619372.0, + "step": 29230 + }, + { + "epoch": 0.2680847162372788, + "learning_rate": 0.00014638489043733384, + "loss": 0.8274, + "mean_token_accuracy": 0.7511480689048767, + "num_tokens": 67642384.0, + "step": 29240 + }, + { + "epoch": 0.26817640047675806, + "learning_rate": 0.00014636655358943798, + "loss": 0.8599, + "mean_token_accuracy": 0.7407106041908265, + "num_tokens": 67665331.0, + "step": 29250 + }, + { + "epoch": 0.26826808471623725, + "learning_rate": 0.00014634821674154214, + "loss": 0.8586, + "mean_token_accuracy": 0.7456808745861053, + "num_tokens": 67688857.0, + "step": 29260 + }, + { + "epoch": 0.2683597689557165, + "learning_rate": 0.00014632987989364628, + "loss": 0.8359, + "mean_token_accuracy": 0.7532157719135284, + "num_tokens": 67711592.0, + "step": 29270 + }, + { + "epoch": 0.26845145319519575, + "learning_rate": 0.00014631154304575042, + "loss": 0.8353, + "mean_token_accuracy": 0.7491818904876709, + "num_tokens": 67733929.0, + "step": 29280 + }, + { + "epoch": 0.268543137434675, + "learning_rate": 0.0001462932061978546, + "loss": 0.8838, + "mean_token_accuracy": 0.746704387664795, + "num_tokens": 67757078.0, + "step": 29290 + }, + { + "epoch": 0.2686348216741542, + "learning_rate": 0.00014627486934995875, + "loss": 0.9128, + "mean_token_accuracy": 0.736178743839264, + "num_tokens": 67780851.0, + "step": 29300 + }, + { + "epoch": 0.26872650591363345, + "learning_rate": 0.00014625653250206292, + "loss": 0.8629, + "mean_token_accuracy": 0.7438143193721771, + "num_tokens": 67803841.0, + "step": 29310 + }, + { + "epoch": 0.2688181901531127, + "learning_rate": 0.00014623819565416705, + "loss": 0.8135, + "mean_token_accuracy": 0.7553632915019989, + "num_tokens": 67826609.0, + "step": 29320 + }, + { + "epoch": 0.2689098743925919, + "learning_rate": 0.0001462198588062712, + "loss": 0.8803, + "mean_token_accuracy": 0.7446336030960083, + "num_tokens": 67849713.0, + "step": 29330 + }, + { + "epoch": 0.26900155863207115, + "learning_rate": 0.00014620152195837536, + "loss": 0.829, + "mean_token_accuracy": 0.7467943906784058, + "num_tokens": 67872427.0, + "step": 29340 + }, + { + "epoch": 0.2690932428715504, + "learning_rate": 0.00014618318511047952, + "loss": 0.8214, + "mean_token_accuracy": 0.7474032640457153, + "num_tokens": 67895742.0, + "step": 29350 + }, + { + "epoch": 0.2691849271110296, + "learning_rate": 0.0001461648482625837, + "loss": 0.867, + "mean_token_accuracy": 0.7436695754528045, + "num_tokens": 67918365.0, + "step": 29360 + }, + { + "epoch": 0.26927661135050884, + "learning_rate": 0.00014614651141468783, + "loss": 0.8598, + "mean_token_accuracy": 0.7457526862621308, + "num_tokens": 67941987.0, + "step": 29370 + }, + { + "epoch": 0.2693682955899881, + "learning_rate": 0.00014612817456679196, + "loss": 0.8305, + "mean_token_accuracy": 0.7480398297309876, + "num_tokens": 67963766.0, + "step": 29380 + }, + { + "epoch": 0.2694599798294673, + "learning_rate": 0.00014610983771889613, + "loss": 0.8155, + "mean_token_accuracy": 0.7545328974723816, + "num_tokens": 67986842.0, + "step": 29390 + }, + { + "epoch": 0.26955166406894654, + "learning_rate": 0.00014609150087100027, + "loss": 0.8369, + "mean_token_accuracy": 0.7504626631736755, + "num_tokens": 68010395.0, + "step": 29400 + }, + { + "epoch": 0.2696433483084258, + "learning_rate": 0.00014607316402310443, + "loss": 0.8416, + "mean_token_accuracy": 0.7495385110378265, + "num_tokens": 68033735.0, + "step": 29410 + }, + { + "epoch": 0.26973503254790504, + "learning_rate": 0.0001460548271752086, + "loss": 0.9072, + "mean_token_accuracy": 0.7287107169628143, + "num_tokens": 68056965.0, + "step": 29420 + }, + { + "epoch": 0.26982671678738424, + "learning_rate": 0.00014603649032731274, + "loss": 0.8701, + "mean_token_accuracy": 0.7426390469074249, + "num_tokens": 68079781.0, + "step": 29430 + }, + { + "epoch": 0.2699184010268635, + "learning_rate": 0.0001460181534794169, + "loss": 0.8716, + "mean_token_accuracy": 0.7354677617549896, + "num_tokens": 68102197.0, + "step": 29440 + }, + { + "epoch": 0.27001008526634274, + "learning_rate": 0.00014599981663152104, + "loss": 0.8747, + "mean_token_accuracy": 0.7406946778297424, + "num_tokens": 68125530.0, + "step": 29450 + }, + { + "epoch": 0.27010176950582193, + "learning_rate": 0.0001459814797836252, + "loss": 0.8222, + "mean_token_accuracy": 0.749953418970108, + "num_tokens": 68148332.0, + "step": 29460 + }, + { + "epoch": 0.2701934537453012, + "learning_rate": 0.00014596314293572935, + "loss": 0.8235, + "mean_token_accuracy": 0.7534517705440521, + "num_tokens": 68171579.0, + "step": 29470 + }, + { + "epoch": 0.27028513798478043, + "learning_rate": 0.0001459448060878335, + "loss": 0.8509, + "mean_token_accuracy": 0.7438921391963959, + "num_tokens": 68195314.0, + "step": 29480 + }, + { + "epoch": 0.2703768222242596, + "learning_rate": 0.00014592646923993768, + "loss": 0.8843, + "mean_token_accuracy": 0.7390227317810059, + "num_tokens": 68218487.0, + "step": 29490 + }, + { + "epoch": 0.2704685064637389, + "learning_rate": 0.00014590813239204181, + "loss": 0.8721, + "mean_token_accuracy": 0.7434373795986176, + "num_tokens": 68242370.0, + "step": 29500 + }, + { + "epoch": 0.27056019070321813, + "learning_rate": 0.00014588979554414598, + "loss": 0.833, + "mean_token_accuracy": 0.7449617803096771, + "num_tokens": 68265183.0, + "step": 29510 + }, + { + "epoch": 0.2706518749426973, + "learning_rate": 0.00014587145869625012, + "loss": 0.8058, + "mean_token_accuracy": 0.755420982837677, + "num_tokens": 68287846.0, + "step": 29520 + }, + { + "epoch": 0.2707435591821766, + "learning_rate": 0.00014585312184835426, + "loss": 0.8157, + "mean_token_accuracy": 0.7547839224338532, + "num_tokens": 68311104.0, + "step": 29530 + }, + { + "epoch": 0.2708352434216558, + "learning_rate": 0.00014583478500045842, + "loss": 0.8393, + "mean_token_accuracy": 0.7439712226390839, + "num_tokens": 68334408.0, + "step": 29540 + }, + { + "epoch": 0.2709269276611351, + "learning_rate": 0.0001458164481525626, + "loss": 0.8527, + "mean_token_accuracy": 0.7445021390914917, + "num_tokens": 68357512.0, + "step": 29550 + }, + { + "epoch": 0.27101861190061427, + "learning_rate": 0.00014579811130466675, + "loss": 0.8511, + "mean_token_accuracy": 0.7417372643947602, + "num_tokens": 68381227.0, + "step": 29560 + }, + { + "epoch": 0.2711102961400935, + "learning_rate": 0.0001457797744567709, + "loss": 0.8108, + "mean_token_accuracy": 0.7528151869773865, + "num_tokens": 68403866.0, + "step": 29570 + }, + { + "epoch": 0.27120198037957277, + "learning_rate": 0.00014576143760887503, + "loss": 0.8788, + "mean_token_accuracy": 0.745859557390213, + "num_tokens": 68426608.0, + "step": 29580 + }, + { + "epoch": 0.27129366461905197, + "learning_rate": 0.0001457431007609792, + "loss": 0.8505, + "mean_token_accuracy": 0.7478248178958893, + "num_tokens": 68449694.0, + "step": 29590 + }, + { + "epoch": 0.2713853488585312, + "learning_rate": 0.00014572476391308333, + "loss": 0.8461, + "mean_token_accuracy": 0.7508221387863159, + "num_tokens": 68472316.0, + "step": 29600 + }, + { + "epoch": 0.27147703309801047, + "learning_rate": 0.0001457064270651875, + "loss": 0.8502, + "mean_token_accuracy": 0.7456076145172119, + "num_tokens": 68494968.0, + "step": 29610 + }, + { + "epoch": 0.27156871733748966, + "learning_rate": 0.00014568809021729166, + "loss": 0.8447, + "mean_token_accuracy": 0.747329032421112, + "num_tokens": 68517740.0, + "step": 29620 + }, + { + "epoch": 0.2716604015769689, + "learning_rate": 0.0001456697533693958, + "loss": 0.8425, + "mean_token_accuracy": 0.7470325529575348, + "num_tokens": 68540265.0, + "step": 29630 + }, + { + "epoch": 0.27175208581644816, + "learning_rate": 0.00014565141652149997, + "loss": 0.8355, + "mean_token_accuracy": 0.7455933690071106, + "num_tokens": 68563435.0, + "step": 29640 + }, + { + "epoch": 0.27184377005592736, + "learning_rate": 0.0001456330796736041, + "loss": 0.8221, + "mean_token_accuracy": 0.7530646741390228, + "num_tokens": 68587537.0, + "step": 29650 + }, + { + "epoch": 0.2719354542954066, + "learning_rate": 0.00014561474282570827, + "loss": 0.8706, + "mean_token_accuracy": 0.7441581964492798, + "num_tokens": 68610865.0, + "step": 29660 + }, + { + "epoch": 0.27202713853488586, + "learning_rate": 0.0001455964059778124, + "loss": 0.8854, + "mean_token_accuracy": 0.729330575466156, + "num_tokens": 68633724.0, + "step": 29670 + }, + { + "epoch": 0.2721188227743651, + "learning_rate": 0.00014557806912991657, + "loss": 0.8566, + "mean_token_accuracy": 0.7444162905216217, + "num_tokens": 68656674.0, + "step": 29680 + }, + { + "epoch": 0.2722105070138443, + "learning_rate": 0.00014555973228202074, + "loss": 0.8456, + "mean_token_accuracy": 0.7447042107582093, + "num_tokens": 68680344.0, + "step": 29690 + }, + { + "epoch": 0.27230219125332356, + "learning_rate": 0.00014554139543412488, + "loss": 0.8614, + "mean_token_accuracy": 0.7424675345420837, + "num_tokens": 68703847.0, + "step": 29700 + }, + { + "epoch": 0.2723938754928028, + "learning_rate": 0.00014552305858622904, + "loss": 0.8795, + "mean_token_accuracy": 0.7416525959968567, + "num_tokens": 68726794.0, + "step": 29710 + }, + { + "epoch": 0.272485559732282, + "learning_rate": 0.00014550472173833318, + "loss": 0.8345, + "mean_token_accuracy": 0.7532901585102081, + "num_tokens": 68749658.0, + "step": 29720 + }, + { + "epoch": 0.27257724397176125, + "learning_rate": 0.00014548638489043732, + "loss": 0.8869, + "mean_token_accuracy": 0.7452648997306823, + "num_tokens": 68772465.0, + "step": 29730 + }, + { + "epoch": 0.2726689282112405, + "learning_rate": 0.0001454680480425415, + "loss": 0.894, + "mean_token_accuracy": 0.737343817949295, + "num_tokens": 68795707.0, + "step": 29740 + }, + { + "epoch": 0.2727606124507197, + "learning_rate": 0.00014544971119464565, + "loss": 0.8197, + "mean_token_accuracy": 0.7482154846191407, + "num_tokens": 68818929.0, + "step": 29750 + }, + { + "epoch": 0.27285229669019895, + "learning_rate": 0.00014543137434674982, + "loss": 0.828, + "mean_token_accuracy": 0.7502427756786346, + "num_tokens": 68841705.0, + "step": 29760 + }, + { + "epoch": 0.2729439809296782, + "learning_rate": 0.00014541303749885396, + "loss": 0.8427, + "mean_token_accuracy": 0.7512379825115204, + "num_tokens": 68864949.0, + "step": 29770 + }, + { + "epoch": 0.27303566516915745, + "learning_rate": 0.0001453947006509581, + "loss": 0.9004, + "mean_token_accuracy": 0.7296261727809906, + "num_tokens": 68888372.0, + "step": 29780 + }, + { + "epoch": 0.27312734940863664, + "learning_rate": 0.00014537636380306226, + "loss": 0.8255, + "mean_token_accuracy": 0.7524441063404084, + "num_tokens": 68911681.0, + "step": 29790 + }, + { + "epoch": 0.2732190336481159, + "learning_rate": 0.0001453580269551664, + "loss": 0.8377, + "mean_token_accuracy": 0.7447475910186767, + "num_tokens": 68934440.0, + "step": 29800 + }, + { + "epoch": 0.27331071788759514, + "learning_rate": 0.0001453396901072706, + "loss": 0.9117, + "mean_token_accuracy": 0.7330490410327911, + "num_tokens": 68957962.0, + "step": 29810 + }, + { + "epoch": 0.27340240212707434, + "learning_rate": 0.00014532135325937473, + "loss": 0.8504, + "mean_token_accuracy": 0.7409867823123932, + "num_tokens": 68982125.0, + "step": 29820 + }, + { + "epoch": 0.2734940863665536, + "learning_rate": 0.00014530301641147887, + "loss": 0.8472, + "mean_token_accuracy": 0.7477595150470734, + "num_tokens": 69005424.0, + "step": 29830 + }, + { + "epoch": 0.27358577060603284, + "learning_rate": 0.00014528467956358303, + "loss": 0.8487, + "mean_token_accuracy": 0.7439844191074372, + "num_tokens": 69028157.0, + "step": 29840 + }, + { + "epoch": 0.27367745484551204, + "learning_rate": 0.00014526634271568717, + "loss": 0.7956, + "mean_token_accuracy": 0.7536679446697235, + "num_tokens": 69051438.0, + "step": 29850 + }, + { + "epoch": 0.2737691390849913, + "learning_rate": 0.00014524800586779134, + "loss": 0.8545, + "mean_token_accuracy": 0.7462322473526001, + "num_tokens": 69074184.0, + "step": 29860 + }, + { + "epoch": 0.27386082332447054, + "learning_rate": 0.0001452296690198955, + "loss": 0.8447, + "mean_token_accuracy": 0.7494982481002808, + "num_tokens": 69096820.0, + "step": 29870 + }, + { + "epoch": 0.27395250756394973, + "learning_rate": 0.00014521133217199964, + "loss": 0.8507, + "mean_token_accuracy": 0.7408902049064636, + "num_tokens": 69119900.0, + "step": 29880 + }, + { + "epoch": 0.274044191803429, + "learning_rate": 0.0001451929953241038, + "loss": 0.8554, + "mean_token_accuracy": 0.744701224565506, + "num_tokens": 69143006.0, + "step": 29890 + }, + { + "epoch": 0.27413587604290823, + "learning_rate": 0.00014517465847620794, + "loss": 0.8518, + "mean_token_accuracy": 0.746039605140686, + "num_tokens": 69166044.0, + "step": 29900 + }, + { + "epoch": 0.2742275602823875, + "learning_rate": 0.0001451563216283121, + "loss": 0.8569, + "mean_token_accuracy": 0.7490433156490326, + "num_tokens": 69188816.0, + "step": 29910 + }, + { + "epoch": 0.2743192445218667, + "learning_rate": 0.00014513798478041625, + "loss": 0.8696, + "mean_token_accuracy": 0.7380292892456055, + "num_tokens": 69211601.0, + "step": 29920 + }, + { + "epoch": 0.27441092876134593, + "learning_rate": 0.00014511964793252039, + "loss": 0.8344, + "mean_token_accuracy": 0.7535680830478668, + "num_tokens": 69234842.0, + "step": 29930 + }, + { + "epoch": 0.2745026130008252, + "learning_rate": 0.00014510131108462458, + "loss": 0.8517, + "mean_token_accuracy": 0.7445323169231415, + "num_tokens": 69257837.0, + "step": 29940 + }, + { + "epoch": 0.2745942972403044, + "learning_rate": 0.00014508297423672872, + "loss": 0.8413, + "mean_token_accuracy": 0.7428589642047883, + "num_tokens": 69281484.0, + "step": 29950 + }, + { + "epoch": 0.2746859814797836, + "learning_rate": 0.00014506463738883288, + "loss": 0.8465, + "mean_token_accuracy": 0.7460168719291687, + "num_tokens": 69304230.0, + "step": 29960 + }, + { + "epoch": 0.2747776657192629, + "learning_rate": 0.00014504630054093702, + "loss": 0.8601, + "mean_token_accuracy": 0.7441195726394654, + "num_tokens": 69326555.0, + "step": 29970 + }, + { + "epoch": 0.27486934995874207, + "learning_rate": 0.00014502796369304116, + "loss": 0.8582, + "mean_token_accuracy": 0.7398589491844177, + "num_tokens": 69350255.0, + "step": 29980 + }, + { + "epoch": 0.2749610341982213, + "learning_rate": 0.00014500962684514532, + "loss": 0.9022, + "mean_token_accuracy": 0.7317766427993775, + "num_tokens": 69372911.0, + "step": 29990 + }, + { + "epoch": 0.27505271843770057, + "learning_rate": 0.00014499128999724946, + "loss": 0.8936, + "mean_token_accuracy": 0.7391605913639069, + "num_tokens": 69395940.0, + "step": 30000 + }, + { + "epoch": 0.27514440267717977, + "learning_rate": 0.00014497295314935365, + "loss": 0.9062, + "mean_token_accuracy": 0.7369853496551514, + "num_tokens": 69419661.0, + "step": 30010 + }, + { + "epoch": 0.275236086916659, + "learning_rate": 0.0001449546163014578, + "loss": 0.8753, + "mean_token_accuracy": 0.7369670629501343, + "num_tokens": 69442493.0, + "step": 30020 + }, + { + "epoch": 0.27532777115613827, + "learning_rate": 0.00014493627945356193, + "loss": 0.8738, + "mean_token_accuracy": 0.7404657423496246, + "num_tokens": 69464509.0, + "step": 30030 + }, + { + "epoch": 0.2754194553956175, + "learning_rate": 0.0001449179426056661, + "loss": 0.8409, + "mean_token_accuracy": 0.7477413415908813, + "num_tokens": 69487946.0, + "step": 30040 + }, + { + "epoch": 0.2755111396350967, + "learning_rate": 0.00014489960575777023, + "loss": 0.8618, + "mean_token_accuracy": 0.7451659798622131, + "num_tokens": 69510802.0, + "step": 30050 + }, + { + "epoch": 0.27560282387457596, + "learning_rate": 0.0001448812689098744, + "loss": 0.8637, + "mean_token_accuracy": 0.7422425389289856, + "num_tokens": 69533141.0, + "step": 30060 + }, + { + "epoch": 0.2756945081140552, + "learning_rate": 0.00014486293206197857, + "loss": 0.8407, + "mean_token_accuracy": 0.748996478319168, + "num_tokens": 69556322.0, + "step": 30070 + }, + { + "epoch": 0.2757861923535344, + "learning_rate": 0.0001448445952140827, + "loss": 0.85, + "mean_token_accuracy": 0.7472386837005616, + "num_tokens": 69579630.0, + "step": 30080 + }, + { + "epoch": 0.27587787659301366, + "learning_rate": 0.00014482625836618687, + "loss": 0.841, + "mean_token_accuracy": 0.7489966690540314, + "num_tokens": 69603221.0, + "step": 30090 + }, + { + "epoch": 0.2759695608324929, + "learning_rate": 0.000144807921518291, + "loss": 0.8907, + "mean_token_accuracy": 0.7398915767669678, + "num_tokens": 69626369.0, + "step": 30100 + }, + { + "epoch": 0.2760612450719721, + "learning_rate": 0.00014478958467039517, + "loss": 0.8266, + "mean_token_accuracy": 0.7532822728157044, + "num_tokens": 69649118.0, + "step": 30110 + }, + { + "epoch": 0.27615292931145136, + "learning_rate": 0.0001447712478224993, + "loss": 0.8502, + "mean_token_accuracy": 0.7412570297718049, + "num_tokens": 69671698.0, + "step": 30120 + }, + { + "epoch": 0.2762446135509306, + "learning_rate": 0.00014475291097460345, + "loss": 0.8868, + "mean_token_accuracy": 0.7416863083839417, + "num_tokens": 69694071.0, + "step": 30130 + }, + { + "epoch": 0.2763362977904098, + "learning_rate": 0.00014473457412670764, + "loss": 0.8427, + "mean_token_accuracy": 0.7469041466712951, + "num_tokens": 69716804.0, + "step": 30140 + }, + { + "epoch": 0.27642798202988905, + "learning_rate": 0.00014471623727881178, + "loss": 0.8594, + "mean_token_accuracy": 0.7424174904823303, + "num_tokens": 69739564.0, + "step": 30150 + }, + { + "epoch": 0.2765196662693683, + "learning_rate": 0.00014469790043091595, + "loss": 0.8536, + "mean_token_accuracy": 0.7470351040363312, + "num_tokens": 69762953.0, + "step": 30160 + }, + { + "epoch": 0.27661135050884755, + "learning_rate": 0.00014467956358302008, + "loss": 0.847, + "mean_token_accuracy": 0.7427092969417572, + "num_tokens": 69786264.0, + "step": 30170 + }, + { + "epoch": 0.27670303474832675, + "learning_rate": 0.00014466122673512422, + "loss": 0.8849, + "mean_token_accuracy": 0.7354965507984161, + "num_tokens": 69809539.0, + "step": 30180 + }, + { + "epoch": 0.276794718987806, + "learning_rate": 0.0001446428898872284, + "loss": 0.8127, + "mean_token_accuracy": 0.7516207277774811, + "num_tokens": 69832795.0, + "step": 30190 + }, + { + "epoch": 0.27688640322728525, + "learning_rate": 0.00014462455303933255, + "loss": 0.8366, + "mean_token_accuracy": 0.7521384298801422, + "num_tokens": 69855803.0, + "step": 30200 + }, + { + "epoch": 0.27697808746676444, + "learning_rate": 0.00014460621619143672, + "loss": 0.8735, + "mean_token_accuracy": 0.7349007666110993, + "num_tokens": 69879872.0, + "step": 30210 + }, + { + "epoch": 0.2770697717062437, + "learning_rate": 0.00014458787934354086, + "loss": 0.8686, + "mean_token_accuracy": 0.7428090989589691, + "num_tokens": 69903014.0, + "step": 30220 + }, + { + "epoch": 0.27716145594572295, + "learning_rate": 0.000144569542495645, + "loss": 0.8473, + "mean_token_accuracy": 0.7449588358402253, + "num_tokens": 69926856.0, + "step": 30230 + }, + { + "epoch": 0.27725314018520214, + "learning_rate": 0.00014455120564774916, + "loss": 0.8619, + "mean_token_accuracy": 0.7457121670246124, + "num_tokens": 69949635.0, + "step": 30240 + }, + { + "epoch": 0.2773448244246814, + "learning_rate": 0.0001445328687998533, + "loss": 0.853, + "mean_token_accuracy": 0.7396000623703003, + "num_tokens": 69972313.0, + "step": 30250 + }, + { + "epoch": 0.27743650866416064, + "learning_rate": 0.00014451453195195746, + "loss": 0.813, + "mean_token_accuracy": 0.7499053537845611, + "num_tokens": 69995105.0, + "step": 30260 + }, + { + "epoch": 0.2775281929036399, + "learning_rate": 0.00014449619510406163, + "loss": 0.8618, + "mean_token_accuracy": 0.7377649426460267, + "num_tokens": 70018594.0, + "step": 30270 + }, + { + "epoch": 0.2776198771431191, + "learning_rate": 0.00014447785825616577, + "loss": 0.8321, + "mean_token_accuracy": 0.753245210647583, + "num_tokens": 70041959.0, + "step": 30280 + }, + { + "epoch": 0.27771156138259834, + "learning_rate": 0.00014445952140826993, + "loss": 0.8702, + "mean_token_accuracy": 0.7458824634552002, + "num_tokens": 70064932.0, + "step": 30290 + }, + { + "epoch": 0.2778032456220776, + "learning_rate": 0.00014444118456037407, + "loss": 0.8276, + "mean_token_accuracy": 0.7527470052242279, + "num_tokens": 70087530.0, + "step": 30300 + }, + { + "epoch": 0.2778949298615568, + "learning_rate": 0.00014442284771247824, + "loss": 0.8575, + "mean_token_accuracy": 0.7428588151931763, + "num_tokens": 70111207.0, + "step": 30310 + }, + { + "epoch": 0.27798661410103603, + "learning_rate": 0.00014440451086458238, + "loss": 0.8442, + "mean_token_accuracy": 0.7492354273796081, + "num_tokens": 70133716.0, + "step": 30320 + }, + { + "epoch": 0.2780782983405153, + "learning_rate": 0.00014438617401668654, + "loss": 0.8378, + "mean_token_accuracy": 0.7398899555206299, + "num_tokens": 70156836.0, + "step": 30330 + }, + { + "epoch": 0.2781699825799945, + "learning_rate": 0.0001443678371687907, + "loss": 0.8777, + "mean_token_accuracy": 0.7388945102691651, + "num_tokens": 70179296.0, + "step": 30340 + }, + { + "epoch": 0.27826166681947373, + "learning_rate": 0.00014434950032089484, + "loss": 0.8441, + "mean_token_accuracy": 0.7435081481933594, + "num_tokens": 70202823.0, + "step": 30350 + }, + { + "epoch": 0.278353351058953, + "learning_rate": 0.000144331163472999, + "loss": 0.8823, + "mean_token_accuracy": 0.7377229452133178, + "num_tokens": 70226026.0, + "step": 30360 + }, + { + "epoch": 0.2784450352984322, + "learning_rate": 0.00014431282662510315, + "loss": 0.8192, + "mean_token_accuracy": 0.7503212690353394, + "num_tokens": 70249365.0, + "step": 30370 + }, + { + "epoch": 0.2785367195379114, + "learning_rate": 0.0001442944897772073, + "loss": 0.8929, + "mean_token_accuracy": 0.729200690984726, + "num_tokens": 70272518.0, + "step": 30380 + }, + { + "epoch": 0.2786284037773907, + "learning_rate": 0.00014427615292931145, + "loss": 0.8414, + "mean_token_accuracy": 0.7466009974479675, + "num_tokens": 70296084.0, + "step": 30390 + }, + { + "epoch": 0.2787200880168699, + "learning_rate": 0.00014425781608141562, + "loss": 0.81, + "mean_token_accuracy": 0.7537119925022125, + "num_tokens": 70319467.0, + "step": 30400 + }, + { + "epoch": 0.2788117722563491, + "learning_rate": 0.00014423947923351978, + "loss": 0.9073, + "mean_token_accuracy": 0.7421898543834686, + "num_tokens": 70342795.0, + "step": 30410 + }, + { + "epoch": 0.2789034564958284, + "learning_rate": 0.00014422114238562392, + "loss": 0.8277, + "mean_token_accuracy": 0.7475308477878571, + "num_tokens": 70366224.0, + "step": 30420 + }, + { + "epoch": 0.2789951407353076, + "learning_rate": 0.00014420280553772806, + "loss": 0.841, + "mean_token_accuracy": 0.751807564496994, + "num_tokens": 70389878.0, + "step": 30430 + }, + { + "epoch": 0.2790868249747868, + "learning_rate": 0.00014418446868983223, + "loss": 0.8571, + "mean_token_accuracy": 0.7408379077911377, + "num_tokens": 70413175.0, + "step": 30440 + }, + { + "epoch": 0.27917850921426607, + "learning_rate": 0.00014416613184193636, + "loss": 0.8473, + "mean_token_accuracy": 0.7510758996009826, + "num_tokens": 70436352.0, + "step": 30450 + }, + { + "epoch": 0.2792701934537453, + "learning_rate": 0.00014414779499404053, + "loss": 0.8255, + "mean_token_accuracy": 0.7521364748477936, + "num_tokens": 70459425.0, + "step": 30460 + }, + { + "epoch": 0.2793618776932245, + "learning_rate": 0.0001441294581461447, + "loss": 0.871, + "mean_token_accuracy": 0.744724178314209, + "num_tokens": 70482852.0, + "step": 30470 + }, + { + "epoch": 0.27945356193270376, + "learning_rate": 0.00014411112129824883, + "loss": 0.8848, + "mean_token_accuracy": 0.7340844094753265, + "num_tokens": 70506594.0, + "step": 30480 + }, + { + "epoch": 0.279545246172183, + "learning_rate": 0.000144092784450353, + "loss": 0.8555, + "mean_token_accuracy": 0.744951730966568, + "num_tokens": 70529541.0, + "step": 30490 + }, + { + "epoch": 0.2796369304116622, + "learning_rate": 0.00014407444760245714, + "loss": 0.8694, + "mean_token_accuracy": 0.7414206326007843, + "num_tokens": 70553084.0, + "step": 30500 + }, + { + "epoch": 0.27972861465114146, + "learning_rate": 0.0001440561107545613, + "loss": 0.8501, + "mean_token_accuracy": 0.7483701586723328, + "num_tokens": 70576154.0, + "step": 30510 + }, + { + "epoch": 0.2798202988906207, + "learning_rate": 0.00014403777390666544, + "loss": 0.8383, + "mean_token_accuracy": 0.7501836717128754, + "num_tokens": 70599045.0, + "step": 30520 + }, + { + "epoch": 0.27991198313009996, + "learning_rate": 0.0001440194370587696, + "loss": 0.8635, + "mean_token_accuracy": 0.7398757040500641, + "num_tokens": 70622118.0, + "step": 30530 + }, + { + "epoch": 0.28000366736957916, + "learning_rate": 0.00014400110021087377, + "loss": 0.8549, + "mean_token_accuracy": 0.744711983203888, + "num_tokens": 70645721.0, + "step": 30540 + }, + { + "epoch": 0.2800953516090584, + "learning_rate": 0.0001439827633629779, + "loss": 0.8319, + "mean_token_accuracy": 0.7482663452625274, + "num_tokens": 70669074.0, + "step": 30550 + }, + { + "epoch": 0.28018703584853766, + "learning_rate": 0.00014396442651508207, + "loss": 0.8221, + "mean_token_accuracy": 0.7502211153507232, + "num_tokens": 70691889.0, + "step": 30560 + }, + { + "epoch": 0.28027872008801685, + "learning_rate": 0.0001439460896671862, + "loss": 0.8315, + "mean_token_accuracy": 0.7460961759090423, + "num_tokens": 70715519.0, + "step": 30570 + }, + { + "epoch": 0.2803704043274961, + "learning_rate": 0.00014392775281929035, + "loss": 0.8272, + "mean_token_accuracy": 0.7456342220306397, + "num_tokens": 70738545.0, + "step": 30580 + }, + { + "epoch": 0.28046208856697535, + "learning_rate": 0.00014390941597139454, + "loss": 0.8636, + "mean_token_accuracy": 0.7371834278106689, + "num_tokens": 70761485.0, + "step": 30590 + }, + { + "epoch": 0.28055377280645455, + "learning_rate": 0.00014389107912349868, + "loss": 0.858, + "mean_token_accuracy": 0.7476982533931732, + "num_tokens": 70785250.0, + "step": 30600 + }, + { + "epoch": 0.2806454570459338, + "learning_rate": 0.00014387274227560285, + "loss": 0.8226, + "mean_token_accuracy": 0.7469619154930115, + "num_tokens": 70808223.0, + "step": 30610 + }, + { + "epoch": 0.28073714128541305, + "learning_rate": 0.00014385440542770699, + "loss": 0.8946, + "mean_token_accuracy": 0.7383210480213165, + "num_tokens": 70830986.0, + "step": 30620 + }, + { + "epoch": 0.28082882552489224, + "learning_rate": 0.00014383606857981112, + "loss": 0.8498, + "mean_token_accuracy": 0.7438196122646332, + "num_tokens": 70853956.0, + "step": 30630 + }, + { + "epoch": 0.2809205097643715, + "learning_rate": 0.0001438177317319153, + "loss": 0.8523, + "mean_token_accuracy": 0.7453059732913971, + "num_tokens": 70877787.0, + "step": 30640 + }, + { + "epoch": 0.28101219400385075, + "learning_rate": 0.00014379939488401943, + "loss": 0.8188, + "mean_token_accuracy": 0.75405233502388, + "num_tokens": 70900938.0, + "step": 30650 + }, + { + "epoch": 0.28110387824333, + "learning_rate": 0.0001437810580361236, + "loss": 0.8804, + "mean_token_accuracy": 0.7383061647415161, + "num_tokens": 70924212.0, + "step": 30660 + }, + { + "epoch": 0.2811955624828092, + "learning_rate": 0.00014376272118822776, + "loss": 0.8409, + "mean_token_accuracy": 0.745840048789978, + "num_tokens": 70947002.0, + "step": 30670 + }, + { + "epoch": 0.28128724672228844, + "learning_rate": 0.0001437443843403319, + "loss": 0.8286, + "mean_token_accuracy": 0.7478355526924133, + "num_tokens": 70969438.0, + "step": 30680 + }, + { + "epoch": 0.2813789309617677, + "learning_rate": 0.00014372604749243606, + "loss": 0.842, + "mean_token_accuracy": 0.74234339594841, + "num_tokens": 70992775.0, + "step": 30690 + }, + { + "epoch": 0.2814706152012469, + "learning_rate": 0.0001437077106445402, + "loss": 0.8366, + "mean_token_accuracy": 0.7444370150566101, + "num_tokens": 71016071.0, + "step": 30700 + }, + { + "epoch": 0.28156229944072614, + "learning_rate": 0.00014368937379664437, + "loss": 0.8425, + "mean_token_accuracy": 0.7464881598949432, + "num_tokens": 71038736.0, + "step": 30710 + }, + { + "epoch": 0.2816539836802054, + "learning_rate": 0.00014367103694874853, + "loss": 0.8245, + "mean_token_accuracy": 0.7483361184597015, + "num_tokens": 71061500.0, + "step": 30720 + }, + { + "epoch": 0.2817456679196846, + "learning_rate": 0.00014365270010085267, + "loss": 0.8815, + "mean_token_accuracy": 0.7391713559627533, + "num_tokens": 71084834.0, + "step": 30730 + }, + { + "epoch": 0.28183735215916383, + "learning_rate": 0.00014363436325295684, + "loss": 0.862, + "mean_token_accuracy": 0.7401086568832398, + "num_tokens": 71107733.0, + "step": 30740 + }, + { + "epoch": 0.2819290363986431, + "learning_rate": 0.00014361602640506097, + "loss": 0.8587, + "mean_token_accuracy": 0.7415320634841919, + "num_tokens": 71130038.0, + "step": 30750 + }, + { + "epoch": 0.2820207206381223, + "learning_rate": 0.00014359768955716514, + "loss": 0.8745, + "mean_token_accuracy": 0.7403928756713867, + "num_tokens": 71153764.0, + "step": 30760 + }, + { + "epoch": 0.28211240487760153, + "learning_rate": 0.00014357935270926928, + "loss": 0.8647, + "mean_token_accuracy": 0.7437114596366883, + "num_tokens": 71176764.0, + "step": 30770 + }, + { + "epoch": 0.2822040891170808, + "learning_rate": 0.00014356101586137342, + "loss": 0.8858, + "mean_token_accuracy": 0.7416842520236969, + "num_tokens": 71200580.0, + "step": 30780 + }, + { + "epoch": 0.28229577335656003, + "learning_rate": 0.0001435426790134776, + "loss": 0.8533, + "mean_token_accuracy": 0.7468991339206695, + "num_tokens": 71223847.0, + "step": 30790 + }, + { + "epoch": 0.2823874575960392, + "learning_rate": 0.00014352434216558175, + "loss": 0.8709, + "mean_token_accuracy": 0.7413143992424012, + "num_tokens": 71247311.0, + "step": 30800 + }, + { + "epoch": 0.2824791418355185, + "learning_rate": 0.0001435060053176859, + "loss": 0.8798, + "mean_token_accuracy": 0.7401417315006256, + "num_tokens": 71270464.0, + "step": 30810 + }, + { + "epoch": 0.2825708260749977, + "learning_rate": 0.00014348766846979005, + "loss": 0.8277, + "mean_token_accuracy": 0.7541962921619415, + "num_tokens": 71293295.0, + "step": 30820 + }, + { + "epoch": 0.2826625103144769, + "learning_rate": 0.0001434693316218942, + "loss": 0.839, + "mean_token_accuracy": 0.751328992843628, + "num_tokens": 71316894.0, + "step": 30830 + }, + { + "epoch": 0.2827541945539562, + "learning_rate": 0.00014345099477399835, + "loss": 0.8572, + "mean_token_accuracy": 0.746560251712799, + "num_tokens": 71339751.0, + "step": 30840 + }, + { + "epoch": 0.2828458787934354, + "learning_rate": 0.00014343265792610252, + "loss": 0.8152, + "mean_token_accuracy": 0.7542898833751679, + "num_tokens": 71362966.0, + "step": 30850 + }, + { + "epoch": 0.2829375630329146, + "learning_rate": 0.00014341432107820666, + "loss": 0.8849, + "mean_token_accuracy": 0.7338407158851623, + "num_tokens": 71386109.0, + "step": 30860 + }, + { + "epoch": 0.28302924727239387, + "learning_rate": 0.00014339598423031082, + "loss": 0.8696, + "mean_token_accuracy": 0.7444013357162476, + "num_tokens": 71409278.0, + "step": 30870 + }, + { + "epoch": 0.2831209315118731, + "learning_rate": 0.00014337764738241496, + "loss": 0.8533, + "mean_token_accuracy": 0.7491775214672088, + "num_tokens": 71433147.0, + "step": 30880 + }, + { + "epoch": 0.28321261575135237, + "learning_rate": 0.00014335931053451913, + "loss": 0.8571, + "mean_token_accuracy": 0.7481815874576568, + "num_tokens": 71455969.0, + "step": 30890 + }, + { + "epoch": 0.28330429999083157, + "learning_rate": 0.00014334097368662327, + "loss": 0.8394, + "mean_token_accuracy": 0.740744435787201, + "num_tokens": 71479000.0, + "step": 30900 + }, + { + "epoch": 0.2833959842303108, + "learning_rate": 0.00014332263683872743, + "loss": 0.8614, + "mean_token_accuracy": 0.7422500550746918, + "num_tokens": 71502807.0, + "step": 30910 + }, + { + "epoch": 0.28348766846979007, + "learning_rate": 0.0001433042999908316, + "loss": 0.8567, + "mean_token_accuracy": 0.7460370779037475, + "num_tokens": 71525740.0, + "step": 30920 + }, + { + "epoch": 0.28357935270926926, + "learning_rate": 0.00014328596314293573, + "loss": 0.9152, + "mean_token_accuracy": 0.7335561573505401, + "num_tokens": 71548360.0, + "step": 30930 + }, + { + "epoch": 0.2836710369487485, + "learning_rate": 0.0001432676262950399, + "loss": 0.8688, + "mean_token_accuracy": 0.7373440802097321, + "num_tokens": 71571150.0, + "step": 30940 + }, + { + "epoch": 0.28376272118822776, + "learning_rate": 0.00014324928944714404, + "loss": 0.8736, + "mean_token_accuracy": 0.7447324335575104, + "num_tokens": 71594344.0, + "step": 30950 + }, + { + "epoch": 0.28385440542770696, + "learning_rate": 0.0001432309525992482, + "loss": 0.8243, + "mean_token_accuracy": 0.7510844051837922, + "num_tokens": 71616975.0, + "step": 30960 + }, + { + "epoch": 0.2839460896671862, + "learning_rate": 0.00014321261575135234, + "loss": 0.8865, + "mean_token_accuracy": 0.7364141762256622, + "num_tokens": 71640641.0, + "step": 30970 + }, + { + "epoch": 0.28403777390666546, + "learning_rate": 0.0001431942789034565, + "loss": 0.8659, + "mean_token_accuracy": 0.7428589820861816, + "num_tokens": 71663679.0, + "step": 30980 + }, + { + "epoch": 0.28412945814614465, + "learning_rate": 0.00014317594205556067, + "loss": 0.8875, + "mean_token_accuracy": 0.7394986510276794, + "num_tokens": 71686389.0, + "step": 30990 + }, + { + "epoch": 0.2842211423856239, + "learning_rate": 0.0001431576052076648, + "loss": 0.8758, + "mean_token_accuracy": 0.7456152856349945, + "num_tokens": 71709668.0, + "step": 31000 + }, + { + "epoch": 0.28431282662510315, + "learning_rate": 0.00014313926835976898, + "loss": 0.8652, + "mean_token_accuracy": 0.7445572733879089, + "num_tokens": 71732192.0, + "step": 31010 + }, + { + "epoch": 0.2844045108645824, + "learning_rate": 0.00014312093151187311, + "loss": 0.8558, + "mean_token_accuracy": 0.7428758382797241, + "num_tokens": 71755527.0, + "step": 31020 + }, + { + "epoch": 0.2844961951040616, + "learning_rate": 0.00014310259466397725, + "loss": 0.8545, + "mean_token_accuracy": 0.7395639896392823, + "num_tokens": 71779069.0, + "step": 31030 + }, + { + "epoch": 0.28458787934354085, + "learning_rate": 0.00014308425781608142, + "loss": 0.8513, + "mean_token_accuracy": 0.742822241783142, + "num_tokens": 71802376.0, + "step": 31040 + }, + { + "epoch": 0.2846795635830201, + "learning_rate": 0.00014306592096818558, + "loss": 0.8782, + "mean_token_accuracy": 0.741634726524353, + "num_tokens": 71825712.0, + "step": 31050 + }, + { + "epoch": 0.2847712478224993, + "learning_rate": 0.00014304758412028972, + "loss": 0.8739, + "mean_token_accuracy": 0.7346738338470459, + "num_tokens": 71848767.0, + "step": 31060 + }, + { + "epoch": 0.28486293206197855, + "learning_rate": 0.0001430292472723939, + "loss": 0.8763, + "mean_token_accuracy": 0.7358915567398071, + "num_tokens": 71871158.0, + "step": 31070 + }, + { + "epoch": 0.2849546163014578, + "learning_rate": 0.00014301091042449803, + "loss": 0.8511, + "mean_token_accuracy": 0.7476229250431061, + "num_tokens": 71894272.0, + "step": 31080 + }, + { + "epoch": 0.285046300540937, + "learning_rate": 0.0001429925735766022, + "loss": 0.8733, + "mean_token_accuracy": 0.7406140685081481, + "num_tokens": 71918164.0, + "step": 31090 + }, + { + "epoch": 0.28513798478041624, + "learning_rate": 0.00014297423672870633, + "loss": 0.8656, + "mean_token_accuracy": 0.7448238968849182, + "num_tokens": 71941865.0, + "step": 31100 + }, + { + "epoch": 0.2852296690198955, + "learning_rate": 0.0001429558998808105, + "loss": 0.8594, + "mean_token_accuracy": 0.7404263973236084, + "num_tokens": 71965151.0, + "step": 31110 + }, + { + "epoch": 0.2853213532593747, + "learning_rate": 0.00014293756303291466, + "loss": 0.8156, + "mean_token_accuracy": 0.7532539010047913, + "num_tokens": 71988453.0, + "step": 31120 + }, + { + "epoch": 0.28541303749885394, + "learning_rate": 0.0001429192261850188, + "loss": 0.8983, + "mean_token_accuracy": 0.7389238178730011, + "num_tokens": 72011386.0, + "step": 31130 + }, + { + "epoch": 0.2855047217383332, + "learning_rate": 0.00014290088933712296, + "loss": 0.9089, + "mean_token_accuracy": 0.7329099833965301, + "num_tokens": 72034207.0, + "step": 31140 + }, + { + "epoch": 0.28559640597781244, + "learning_rate": 0.0001428825524892271, + "loss": 0.8606, + "mean_token_accuracy": 0.7471947193145752, + "num_tokens": 72057621.0, + "step": 31150 + }, + { + "epoch": 0.28568809021729163, + "learning_rate": 0.00014286421564133127, + "loss": 0.8724, + "mean_token_accuracy": 0.7492359936237335, + "num_tokens": 72079852.0, + "step": 31160 + }, + { + "epoch": 0.2857797744567709, + "learning_rate": 0.0001428458787934354, + "loss": 0.8466, + "mean_token_accuracy": 0.747854334115982, + "num_tokens": 72104097.0, + "step": 31170 + }, + { + "epoch": 0.28587145869625014, + "learning_rate": 0.00014282754194553957, + "loss": 0.9065, + "mean_token_accuracy": 0.7415757656097413, + "num_tokens": 72128268.0, + "step": 31180 + }, + { + "epoch": 0.28596314293572933, + "learning_rate": 0.00014280920509764374, + "loss": 0.83, + "mean_token_accuracy": 0.7463529765605926, + "num_tokens": 72152418.0, + "step": 31190 + }, + { + "epoch": 0.2860548271752086, + "learning_rate": 0.00014279086824974788, + "loss": 0.818, + "mean_token_accuracy": 0.7579379498958587, + "num_tokens": 72175496.0, + "step": 31200 + }, + { + "epoch": 0.28614651141468783, + "learning_rate": 0.00014277253140185204, + "loss": 0.8393, + "mean_token_accuracy": 0.7471842169761658, + "num_tokens": 72198625.0, + "step": 31210 + }, + { + "epoch": 0.286238195654167, + "learning_rate": 0.00014275419455395618, + "loss": 0.8186, + "mean_token_accuracy": 0.7483863472938538, + "num_tokens": 72222112.0, + "step": 31220 + }, + { + "epoch": 0.2863298798936463, + "learning_rate": 0.00014273585770606032, + "loss": 0.84, + "mean_token_accuracy": 0.7470630824565887, + "num_tokens": 72244957.0, + "step": 31230 + }, + { + "epoch": 0.28642156413312553, + "learning_rate": 0.00014271752085816448, + "loss": 0.87, + "mean_token_accuracy": 0.7364301800727844, + "num_tokens": 72267893.0, + "step": 31240 + }, + { + "epoch": 0.2865132483726047, + "learning_rate": 0.00014269918401026865, + "loss": 0.8761, + "mean_token_accuracy": 0.7397234499454498, + "num_tokens": 72291577.0, + "step": 31250 + }, + { + "epoch": 0.286604932612084, + "learning_rate": 0.0001426808471623728, + "loss": 0.829, + "mean_token_accuracy": 0.7466777324676513, + "num_tokens": 72314451.0, + "step": 31260 + }, + { + "epoch": 0.2866966168515632, + "learning_rate": 0.00014266251031447695, + "loss": 0.8717, + "mean_token_accuracy": 0.7358124434947968, + "num_tokens": 72337215.0, + "step": 31270 + }, + { + "epoch": 0.2867883010910425, + "learning_rate": 0.0001426441734665811, + "loss": 0.8797, + "mean_token_accuracy": 0.7377731680870057, + "num_tokens": 72360521.0, + "step": 31280 + }, + { + "epoch": 0.28687998533052167, + "learning_rate": 0.00014262583661868526, + "loss": 0.9012, + "mean_token_accuracy": 0.7384210169315338, + "num_tokens": 72384074.0, + "step": 31290 + }, + { + "epoch": 0.2869716695700009, + "learning_rate": 0.0001426074997707894, + "loss": 0.8515, + "mean_token_accuracy": 0.7453174591064453, + "num_tokens": 72406413.0, + "step": 31300 + }, + { + "epoch": 0.28706335380948017, + "learning_rate": 0.00014258916292289356, + "loss": 0.896, + "mean_token_accuracy": 0.7345102667808533, + "num_tokens": 72430027.0, + "step": 31310 + }, + { + "epoch": 0.28715503804895937, + "learning_rate": 0.00014257082607499773, + "loss": 0.8634, + "mean_token_accuracy": 0.7416463077068329, + "num_tokens": 72452820.0, + "step": 31320 + }, + { + "epoch": 0.2872467222884386, + "learning_rate": 0.00014255248922710186, + "loss": 0.8291, + "mean_token_accuracy": 0.7540943801403046, + "num_tokens": 72475923.0, + "step": 31330 + }, + { + "epoch": 0.28733840652791787, + "learning_rate": 0.00014253415237920603, + "loss": 0.821, + "mean_token_accuracy": 0.748418390750885, + "num_tokens": 72498435.0, + "step": 31340 + }, + { + "epoch": 0.28743009076739706, + "learning_rate": 0.00014251581553131017, + "loss": 0.8536, + "mean_token_accuracy": 0.7409149229526519, + "num_tokens": 72521049.0, + "step": 31350 + }, + { + "epoch": 0.2875217750068763, + "learning_rate": 0.00014249747868341433, + "loss": 0.8704, + "mean_token_accuracy": 0.7396306455135345, + "num_tokens": 72544866.0, + "step": 31360 + }, + { + "epoch": 0.28761345924635556, + "learning_rate": 0.00014247914183551847, + "loss": 0.8469, + "mean_token_accuracy": 0.7428924560546875, + "num_tokens": 72568158.0, + "step": 31370 + }, + { + "epoch": 0.28770514348583476, + "learning_rate": 0.00014246080498762264, + "loss": 0.8989, + "mean_token_accuracy": 0.7329227685928345, + "num_tokens": 72591398.0, + "step": 31380 + }, + { + "epoch": 0.287796827725314, + "learning_rate": 0.0001424424681397268, + "loss": 0.8552, + "mean_token_accuracy": 0.742163461446762, + "num_tokens": 72614580.0, + "step": 31390 + }, + { + "epoch": 0.28788851196479326, + "learning_rate": 0.00014242413129183094, + "loss": 0.8503, + "mean_token_accuracy": 0.7476768851280212, + "num_tokens": 72637245.0, + "step": 31400 + }, + { + "epoch": 0.2879801962042725, + "learning_rate": 0.0001424057944439351, + "loss": 0.8731, + "mean_token_accuracy": 0.7394823253154754, + "num_tokens": 72659984.0, + "step": 31410 + }, + { + "epoch": 0.2880718804437517, + "learning_rate": 0.00014238745759603924, + "loss": 0.843, + "mean_token_accuracy": 0.7433938205242157, + "num_tokens": 72683009.0, + "step": 31420 + }, + { + "epoch": 0.28816356468323095, + "learning_rate": 0.00014236912074814338, + "loss": 0.8716, + "mean_token_accuracy": 0.7435907065868378, + "num_tokens": 72706440.0, + "step": 31430 + }, + { + "epoch": 0.2882552489227102, + "learning_rate": 0.00014235078390024757, + "loss": 0.8393, + "mean_token_accuracy": 0.7424872159957886, + "num_tokens": 72729641.0, + "step": 31440 + }, + { + "epoch": 0.2883469331621894, + "learning_rate": 0.0001423324470523517, + "loss": 0.8858, + "mean_token_accuracy": 0.7388116776943207, + "num_tokens": 72751920.0, + "step": 31450 + }, + { + "epoch": 0.28843861740166865, + "learning_rate": 0.00014231411020445585, + "loss": 0.834, + "mean_token_accuracy": 0.7525705695152283, + "num_tokens": 72775401.0, + "step": 31460 + }, + { + "epoch": 0.2885303016411479, + "learning_rate": 0.00014229577335656002, + "loss": 0.8488, + "mean_token_accuracy": 0.748732203245163, + "num_tokens": 72798287.0, + "step": 31470 + }, + { + "epoch": 0.2886219858806271, + "learning_rate": 0.00014227743650866416, + "loss": 0.8552, + "mean_token_accuracy": 0.7422996640205384, + "num_tokens": 72821016.0, + "step": 31480 + }, + { + "epoch": 0.28871367012010635, + "learning_rate": 0.00014225909966076832, + "loss": 0.9165, + "mean_token_accuracy": 0.733242517709732, + "num_tokens": 72843729.0, + "step": 31490 + }, + { + "epoch": 0.2888053543595856, + "learning_rate": 0.00014224076281287246, + "loss": 0.8356, + "mean_token_accuracy": 0.7454355776309967, + "num_tokens": 72867442.0, + "step": 31500 + }, + { + "epoch": 0.28889703859906485, + "learning_rate": 0.00014222242596497662, + "loss": 0.8887, + "mean_token_accuracy": 0.7318439543247223, + "num_tokens": 72890400.0, + "step": 31510 + }, + { + "epoch": 0.28898872283854404, + "learning_rate": 0.0001422040891170808, + "loss": 0.8894, + "mean_token_accuracy": 0.7362122118473053, + "num_tokens": 72913503.0, + "step": 31520 + }, + { + "epoch": 0.2890804070780233, + "learning_rate": 0.00014218575226918493, + "loss": 0.9052, + "mean_token_accuracy": 0.7309132397174836, + "num_tokens": 72936459.0, + "step": 31530 + }, + { + "epoch": 0.28917209131750254, + "learning_rate": 0.0001421674154212891, + "loss": 0.9119, + "mean_token_accuracy": 0.7345360696315766, + "num_tokens": 72959987.0, + "step": 31540 + }, + { + "epoch": 0.28926377555698174, + "learning_rate": 0.00014214907857339323, + "loss": 0.8745, + "mean_token_accuracy": 0.739002925157547, + "num_tokens": 72982358.0, + "step": 31550 + }, + { + "epoch": 0.289355459796461, + "learning_rate": 0.0001421307417254974, + "loss": 0.8404, + "mean_token_accuracy": 0.7455204069614411, + "num_tokens": 73005658.0, + "step": 31560 + }, + { + "epoch": 0.28944714403594024, + "learning_rate": 0.00014211240487760156, + "loss": 0.8405, + "mean_token_accuracy": 0.7440772473812103, + "num_tokens": 73029475.0, + "step": 31570 + }, + { + "epoch": 0.28953882827541944, + "learning_rate": 0.0001420940680297057, + "loss": 0.8486, + "mean_token_accuracy": 0.7433251142501831, + "num_tokens": 73052807.0, + "step": 31580 + }, + { + "epoch": 0.2896305125148987, + "learning_rate": 0.00014207573118180987, + "loss": 0.8068, + "mean_token_accuracy": 0.7552599966526031, + "num_tokens": 73075825.0, + "step": 31590 + }, + { + "epoch": 0.28972219675437794, + "learning_rate": 0.000142057394333914, + "loss": 0.8596, + "mean_token_accuracy": 0.7442369043827057, + "num_tokens": 73100114.0, + "step": 31600 + }, + { + "epoch": 0.28981388099385713, + "learning_rate": 0.00014203905748601817, + "loss": 0.8543, + "mean_token_accuracy": 0.7419051170349121, + "num_tokens": 73122940.0, + "step": 31610 + }, + { + "epoch": 0.2899055652333364, + "learning_rate": 0.0001420207206381223, + "loss": 0.8841, + "mean_token_accuracy": 0.7381398737430572, + "num_tokens": 73145978.0, + "step": 31620 + }, + { + "epoch": 0.28999724947281563, + "learning_rate": 0.00014200238379022645, + "loss": 0.8814, + "mean_token_accuracy": 0.7453715085983277, + "num_tokens": 73168783.0, + "step": 31630 + }, + { + "epoch": 0.2900889337122949, + "learning_rate": 0.00014198404694233064, + "loss": 0.8441, + "mean_token_accuracy": 0.7435619235038757, + "num_tokens": 73191613.0, + "step": 31640 + }, + { + "epoch": 0.2901806179517741, + "learning_rate": 0.00014196571009443478, + "loss": 0.8577, + "mean_token_accuracy": 0.7409064710140228, + "num_tokens": 73214562.0, + "step": 31650 + }, + { + "epoch": 0.29027230219125333, + "learning_rate": 0.00014194737324653892, + "loss": 0.8651, + "mean_token_accuracy": 0.7437946617603302, + "num_tokens": 73237810.0, + "step": 31660 + }, + { + "epoch": 0.2903639864307326, + "learning_rate": 0.00014192903639864308, + "loss": 0.8256, + "mean_token_accuracy": 0.7505256474018097, + "num_tokens": 73260321.0, + "step": 31670 + }, + { + "epoch": 0.2904556706702118, + "learning_rate": 0.00014191069955074722, + "loss": 0.8271, + "mean_token_accuracy": 0.7476964652538299, + "num_tokens": 73283163.0, + "step": 31680 + }, + { + "epoch": 0.290547354909691, + "learning_rate": 0.00014189236270285138, + "loss": 0.8846, + "mean_token_accuracy": 0.7330077946186065, + "num_tokens": 73306138.0, + "step": 31690 + }, + { + "epoch": 0.2906390391491703, + "learning_rate": 0.00014187402585495555, + "loss": 0.8843, + "mean_token_accuracy": 0.7401116073131562, + "num_tokens": 73330472.0, + "step": 31700 + }, + { + "epoch": 0.29073072338864947, + "learning_rate": 0.0001418556890070597, + "loss": 0.8598, + "mean_token_accuracy": 0.744620555639267, + "num_tokens": 73353624.0, + "step": 31710 + }, + { + "epoch": 0.2908224076281287, + "learning_rate": 0.00014183735215916385, + "loss": 0.8006, + "mean_token_accuracy": 0.7572574019432068, + "num_tokens": 73375890.0, + "step": 31720 + }, + { + "epoch": 0.29091409186760797, + "learning_rate": 0.000141819015311268, + "loss": 0.8572, + "mean_token_accuracy": 0.7402051568031311, + "num_tokens": 73399379.0, + "step": 31730 + }, + { + "epoch": 0.29100577610708717, + "learning_rate": 0.00014180067846337216, + "loss": 0.8812, + "mean_token_accuracy": 0.7400589942932129, + "num_tokens": 73422434.0, + "step": 31740 + }, + { + "epoch": 0.2910974603465664, + "learning_rate": 0.0001417823416154763, + "loss": 0.8361, + "mean_token_accuracy": 0.7483542859554291, + "num_tokens": 73445375.0, + "step": 31750 + }, + { + "epoch": 0.29118914458604567, + "learning_rate": 0.00014176400476758046, + "loss": 0.8666, + "mean_token_accuracy": 0.7430842816829681, + "num_tokens": 73469386.0, + "step": 31760 + }, + { + "epoch": 0.2912808288255249, + "learning_rate": 0.00014174566791968463, + "loss": 0.8514, + "mean_token_accuracy": 0.7490638792514801, + "num_tokens": 73493032.0, + "step": 31770 + }, + { + "epoch": 0.2913725130650041, + "learning_rate": 0.00014172733107178877, + "loss": 0.8882, + "mean_token_accuracy": 0.7369000732898712, + "num_tokens": 73516028.0, + "step": 31780 + }, + { + "epoch": 0.29146419730448336, + "learning_rate": 0.00014170899422389293, + "loss": 0.8378, + "mean_token_accuracy": 0.7542305409908294, + "num_tokens": 73538543.0, + "step": 31790 + }, + { + "epoch": 0.2915558815439626, + "learning_rate": 0.00014169065737599707, + "loss": 0.8599, + "mean_token_accuracy": 0.7383139252662658, + "num_tokens": 73561062.0, + "step": 31800 + }, + { + "epoch": 0.2916475657834418, + "learning_rate": 0.00014167232052810123, + "loss": 0.8321, + "mean_token_accuracy": 0.7473494529724121, + "num_tokens": 73583815.0, + "step": 31810 + }, + { + "epoch": 0.29173925002292106, + "learning_rate": 0.00014165398368020537, + "loss": 0.8517, + "mean_token_accuracy": 0.741040050983429, + "num_tokens": 73607221.0, + "step": 31820 + }, + { + "epoch": 0.2918309342624003, + "learning_rate": 0.00014163564683230954, + "loss": 0.8251, + "mean_token_accuracy": 0.75463907122612, + "num_tokens": 73630164.0, + "step": 31830 + }, + { + "epoch": 0.2919226185018795, + "learning_rate": 0.0001416173099844137, + "loss": 0.8456, + "mean_token_accuracy": 0.7428629636764527, + "num_tokens": 73653482.0, + "step": 31840 + }, + { + "epoch": 0.29201430274135876, + "learning_rate": 0.00014159897313651784, + "loss": 0.8516, + "mean_token_accuracy": 0.7402035355567932, + "num_tokens": 73676116.0, + "step": 31850 + }, + { + "epoch": 0.292105986980838, + "learning_rate": 0.00014158063628862198, + "loss": 0.8303, + "mean_token_accuracy": 0.7501801729202271, + "num_tokens": 73699175.0, + "step": 31860 + }, + { + "epoch": 0.2921976712203172, + "learning_rate": 0.00014156229944072615, + "loss": 0.8469, + "mean_token_accuracy": 0.7425274848937988, + "num_tokens": 73722392.0, + "step": 31870 + }, + { + "epoch": 0.29228935545979645, + "learning_rate": 0.00014154396259283028, + "loss": 0.8236, + "mean_token_accuracy": 0.7515719771385193, + "num_tokens": 73745307.0, + "step": 31880 + }, + { + "epoch": 0.2923810396992757, + "learning_rate": 0.00014152562574493445, + "loss": 0.8413, + "mean_token_accuracy": 0.7502724707126618, + "num_tokens": 73768673.0, + "step": 31890 + }, + { + "epoch": 0.29247272393875495, + "learning_rate": 0.00014150728889703861, + "loss": 0.8771, + "mean_token_accuracy": 0.7392754435539246, + "num_tokens": 73791261.0, + "step": 31900 + }, + { + "epoch": 0.29256440817823415, + "learning_rate": 0.00014148895204914275, + "loss": 0.8344, + "mean_token_accuracy": 0.7486158907413483, + "num_tokens": 73813887.0, + "step": 31910 + }, + { + "epoch": 0.2926560924177134, + "learning_rate": 0.00014147061520124692, + "loss": 0.8244, + "mean_token_accuracy": 0.7549403071403503, + "num_tokens": 73836544.0, + "step": 31920 + }, + { + "epoch": 0.29274777665719265, + "learning_rate": 0.00014145227835335106, + "loss": 0.8586, + "mean_token_accuracy": 0.7428262293338775, + "num_tokens": 73859671.0, + "step": 31930 + }, + { + "epoch": 0.29283946089667184, + "learning_rate": 0.00014143394150545522, + "loss": 0.8345, + "mean_token_accuracy": 0.7449959874153137, + "num_tokens": 73882330.0, + "step": 31940 + }, + { + "epoch": 0.2929311451361511, + "learning_rate": 0.00014141560465755936, + "loss": 0.8951, + "mean_token_accuracy": 0.7362458229064941, + "num_tokens": 73905308.0, + "step": 31950 + }, + { + "epoch": 0.29302282937563034, + "learning_rate": 0.00014139726780966353, + "loss": 0.8614, + "mean_token_accuracy": 0.7479972541332245, + "num_tokens": 73928426.0, + "step": 31960 + }, + { + "epoch": 0.29311451361510954, + "learning_rate": 0.0001413789309617677, + "loss": 0.8455, + "mean_token_accuracy": 0.7483917891979217, + "num_tokens": 73952447.0, + "step": 31970 + }, + { + "epoch": 0.2932061978545888, + "learning_rate": 0.00014136059411387183, + "loss": 0.8445, + "mean_token_accuracy": 0.7439047753810882, + "num_tokens": 73975454.0, + "step": 31980 + }, + { + "epoch": 0.29329788209406804, + "learning_rate": 0.000141342257265976, + "loss": 0.8764, + "mean_token_accuracy": 0.7404709458351135, + "num_tokens": 73999058.0, + "step": 31990 + }, + { + "epoch": 0.29338956633354724, + "learning_rate": 0.00014132392041808013, + "loss": 0.8678, + "mean_token_accuracy": 0.7416110396385193, + "num_tokens": 74021635.0, + "step": 32000 + }, + { + "epoch": 0.2934812505730265, + "learning_rate": 0.0001413055835701843, + "loss": 0.8866, + "mean_token_accuracy": 0.7399464905261993, + "num_tokens": 74044911.0, + "step": 32010 + }, + { + "epoch": 0.29357293481250574, + "learning_rate": 0.00014128724672228844, + "loss": 0.8308, + "mean_token_accuracy": 0.7489681363105773, + "num_tokens": 74068136.0, + "step": 32020 + }, + { + "epoch": 0.293664619051985, + "learning_rate": 0.0001412689098743926, + "loss": 0.8597, + "mean_token_accuracy": 0.7433870613574982, + "num_tokens": 74090667.0, + "step": 32030 + }, + { + "epoch": 0.2937563032914642, + "learning_rate": 0.00014125057302649677, + "loss": 0.898, + "mean_token_accuracy": 0.7378264725208282, + "num_tokens": 74114025.0, + "step": 32040 + }, + { + "epoch": 0.29384798753094343, + "learning_rate": 0.0001412322361786009, + "loss": 0.8597, + "mean_token_accuracy": 0.7399658620357513, + "num_tokens": 74136459.0, + "step": 32050 + }, + { + "epoch": 0.2939396717704227, + "learning_rate": 0.00014121389933070504, + "loss": 0.8756, + "mean_token_accuracy": 0.7452867448329925, + "num_tokens": 74159395.0, + "step": 32060 + }, + { + "epoch": 0.2940313560099019, + "learning_rate": 0.0001411955624828092, + "loss": 0.8425, + "mean_token_accuracy": 0.7508084893226623, + "num_tokens": 74182500.0, + "step": 32070 + }, + { + "epoch": 0.29412304024938113, + "learning_rate": 0.00014117722563491335, + "loss": 0.8487, + "mean_token_accuracy": 0.7505961298942566, + "num_tokens": 74205656.0, + "step": 32080 + }, + { + "epoch": 0.2942147244888604, + "learning_rate": 0.00014115888878701754, + "loss": 0.88, + "mean_token_accuracy": 0.7409342706203461, + "num_tokens": 74228330.0, + "step": 32090 + }, + { + "epoch": 0.2943064087283396, + "learning_rate": 0.00014114055193912168, + "loss": 0.8368, + "mean_token_accuracy": 0.7509453773498536, + "num_tokens": 74251978.0, + "step": 32100 + }, + { + "epoch": 0.2943980929678188, + "learning_rate": 0.00014112221509122582, + "loss": 0.8987, + "mean_token_accuracy": 0.7340470790863037, + "num_tokens": 74275035.0, + "step": 32110 + }, + { + "epoch": 0.2944897772072981, + "learning_rate": 0.00014110387824332998, + "loss": 0.8391, + "mean_token_accuracy": 0.7468198537826538, + "num_tokens": 74298321.0, + "step": 32120 + }, + { + "epoch": 0.2945814614467773, + "learning_rate": 0.00014108554139543412, + "loss": 0.8537, + "mean_token_accuracy": 0.7403269171714782, + "num_tokens": 74320919.0, + "step": 32130 + }, + { + "epoch": 0.2946731456862565, + "learning_rate": 0.0001410672045475383, + "loss": 0.827, + "mean_token_accuracy": 0.7486122071743011, + "num_tokens": 74343472.0, + "step": 32140 + }, + { + "epoch": 0.29476482992573577, + "learning_rate": 0.00014104886769964243, + "loss": 0.9174, + "mean_token_accuracy": 0.7354245066642762, + "num_tokens": 74366550.0, + "step": 32150 + }, + { + "epoch": 0.294856514165215, + "learning_rate": 0.0001410305308517466, + "loss": 0.8719, + "mean_token_accuracy": 0.7446018040180207, + "num_tokens": 74389540.0, + "step": 32160 + }, + { + "epoch": 0.2949481984046942, + "learning_rate": 0.00014101219400385076, + "loss": 0.8509, + "mean_token_accuracy": 0.7483080565929413, + "num_tokens": 74412838.0, + "step": 32170 + }, + { + "epoch": 0.29503988264417347, + "learning_rate": 0.0001409938571559549, + "loss": 0.8479, + "mean_token_accuracy": 0.7413890719413757, + "num_tokens": 74436548.0, + "step": 32180 + }, + { + "epoch": 0.2951315668836527, + "learning_rate": 0.00014097552030805906, + "loss": 0.8748, + "mean_token_accuracy": 0.74229536652565, + "num_tokens": 74460687.0, + "step": 32190 + }, + { + "epoch": 0.2952232511231319, + "learning_rate": 0.0001409571834601632, + "loss": 0.8407, + "mean_token_accuracy": 0.7461408078670502, + "num_tokens": 74483701.0, + "step": 32200 + }, + { + "epoch": 0.29531493536261116, + "learning_rate": 0.00014093884661226736, + "loss": 0.8704, + "mean_token_accuracy": 0.7388374507427216, + "num_tokens": 74506773.0, + "step": 32210 + }, + { + "epoch": 0.2954066196020904, + "learning_rate": 0.00014092050976437153, + "loss": 0.8081, + "mean_token_accuracy": 0.755785596370697, + "num_tokens": 74529366.0, + "step": 32220 + }, + { + "epoch": 0.2954983038415696, + "learning_rate": 0.00014090217291647567, + "loss": 0.8629, + "mean_token_accuracy": 0.741152960062027, + "num_tokens": 74552644.0, + "step": 32230 + }, + { + "epoch": 0.29558998808104886, + "learning_rate": 0.00014088383606857983, + "loss": 0.8309, + "mean_token_accuracy": 0.7479057490825654, + "num_tokens": 74575039.0, + "step": 32240 + }, + { + "epoch": 0.2956816723205281, + "learning_rate": 0.00014086549922068397, + "loss": 0.833, + "mean_token_accuracy": 0.7457516610622406, + "num_tokens": 74598000.0, + "step": 32250 + }, + { + "epoch": 0.29577335656000736, + "learning_rate": 0.0001408471623727881, + "loss": 0.8545, + "mean_token_accuracy": 0.7434446692466736, + "num_tokens": 74620147.0, + "step": 32260 + }, + { + "epoch": 0.29586504079948656, + "learning_rate": 0.00014082882552489227, + "loss": 0.8512, + "mean_token_accuracy": 0.7454415023326874, + "num_tokens": 74642345.0, + "step": 32270 + }, + { + "epoch": 0.2959567250389658, + "learning_rate": 0.0001408104886769964, + "loss": 0.8257, + "mean_token_accuracy": 0.7547140061855316, + "num_tokens": 74666155.0, + "step": 32280 + }, + { + "epoch": 0.29604840927844506, + "learning_rate": 0.0001407921518291006, + "loss": 0.8205, + "mean_token_accuracy": 0.7539973735809327, + "num_tokens": 74688943.0, + "step": 32290 + }, + { + "epoch": 0.29614009351792425, + "learning_rate": 0.00014077381498120474, + "loss": 0.8315, + "mean_token_accuracy": 0.7428905308246613, + "num_tokens": 74711307.0, + "step": 32300 + }, + { + "epoch": 0.2962317777574035, + "learning_rate": 0.00014075547813330888, + "loss": 0.8432, + "mean_token_accuracy": 0.7513552963733673, + "num_tokens": 74733617.0, + "step": 32310 + }, + { + "epoch": 0.29632346199688275, + "learning_rate": 0.00014073714128541305, + "loss": 0.8984, + "mean_token_accuracy": 0.732017582654953, + "num_tokens": 74756660.0, + "step": 32320 + }, + { + "epoch": 0.29641514623636195, + "learning_rate": 0.00014071880443751719, + "loss": 0.8261, + "mean_token_accuracy": 0.750505793094635, + "num_tokens": 74779023.0, + "step": 32330 + }, + { + "epoch": 0.2965068304758412, + "learning_rate": 0.00014070046758962135, + "loss": 0.8321, + "mean_token_accuracy": 0.745517760515213, + "num_tokens": 74802343.0, + "step": 32340 + }, + { + "epoch": 0.29659851471532045, + "learning_rate": 0.00014068213074172552, + "loss": 0.8585, + "mean_token_accuracy": 0.7482177495956421, + "num_tokens": 74825804.0, + "step": 32350 + }, + { + "epoch": 0.29669019895479964, + "learning_rate": 0.00014066379389382965, + "loss": 0.839, + "mean_token_accuracy": 0.7464603304862976, + "num_tokens": 74850115.0, + "step": 32360 + }, + { + "epoch": 0.2967818831942789, + "learning_rate": 0.00014064545704593382, + "loss": 0.8827, + "mean_token_accuracy": 0.7317130923271179, + "num_tokens": 74873543.0, + "step": 32370 + }, + { + "epoch": 0.29687356743375815, + "learning_rate": 0.00014062712019803796, + "loss": 0.8646, + "mean_token_accuracy": 0.7418008387088776, + "num_tokens": 74896263.0, + "step": 32380 + }, + { + "epoch": 0.2969652516732374, + "learning_rate": 0.00014060878335014212, + "loss": 0.8314, + "mean_token_accuracy": 0.7491295874118805, + "num_tokens": 74918428.0, + "step": 32390 + }, + { + "epoch": 0.2970569359127166, + "learning_rate": 0.00014059044650224626, + "loss": 0.805, + "mean_token_accuracy": 0.7593595862388611, + "num_tokens": 74941764.0, + "step": 32400 + }, + { + "epoch": 0.29714862015219584, + "learning_rate": 0.00014057210965435043, + "loss": 0.8416, + "mean_token_accuracy": 0.7525422215461731, + "num_tokens": 74965617.0, + "step": 32410 + }, + { + "epoch": 0.2972403043916751, + "learning_rate": 0.0001405537728064546, + "loss": 0.8279, + "mean_token_accuracy": 0.747933852672577, + "num_tokens": 74988959.0, + "step": 32420 + }, + { + "epoch": 0.2973319886311543, + "learning_rate": 0.00014053543595855873, + "loss": 0.8478, + "mean_token_accuracy": 0.7457592070102692, + "num_tokens": 75012040.0, + "step": 32430 + }, + { + "epoch": 0.29742367287063354, + "learning_rate": 0.0001405170991106629, + "loss": 0.8385, + "mean_token_accuracy": 0.7494657516479493, + "num_tokens": 75035529.0, + "step": 32440 + }, + { + "epoch": 0.2975153571101128, + "learning_rate": 0.00014049876226276704, + "loss": 0.8677, + "mean_token_accuracy": 0.7418507039546967, + "num_tokens": 75058556.0, + "step": 32450 + }, + { + "epoch": 0.297607041349592, + "learning_rate": 0.00014048042541487117, + "loss": 0.8996, + "mean_token_accuracy": 0.7299916386604309, + "num_tokens": 75081452.0, + "step": 32460 + }, + { + "epoch": 0.29769872558907123, + "learning_rate": 0.00014046208856697534, + "loss": 0.8431, + "mean_token_accuracy": 0.7505478620529175, + "num_tokens": 75104868.0, + "step": 32470 + }, + { + "epoch": 0.2977904098285505, + "learning_rate": 0.00014044375171907948, + "loss": 0.8368, + "mean_token_accuracy": 0.7543375313282012, + "num_tokens": 75128512.0, + "step": 32480 + }, + { + "epoch": 0.2978820940680297, + "learning_rate": 0.00014042541487118367, + "loss": 0.8516, + "mean_token_accuracy": 0.7499530851840973, + "num_tokens": 75151795.0, + "step": 32490 + }, + { + "epoch": 0.29797377830750893, + "learning_rate": 0.0001404070780232878, + "loss": 0.8384, + "mean_token_accuracy": 0.7483568310737609, + "num_tokens": 75174689.0, + "step": 32500 + }, + { + "epoch": 0.2980654625469882, + "learning_rate": 0.00014038874117539195, + "loss": 0.8768, + "mean_token_accuracy": 0.7385094165802002, + "num_tokens": 75197103.0, + "step": 32510 + }, + { + "epoch": 0.29815714678646743, + "learning_rate": 0.0001403704043274961, + "loss": 0.8555, + "mean_token_accuracy": 0.7431336998939514, + "num_tokens": 75220996.0, + "step": 32520 + }, + { + "epoch": 0.2982488310259466, + "learning_rate": 0.00014035206747960025, + "loss": 0.8396, + "mean_token_accuracy": 0.7378594398498535, + "num_tokens": 75244686.0, + "step": 32530 + }, + { + "epoch": 0.2983405152654259, + "learning_rate": 0.00014033373063170442, + "loss": 0.8554, + "mean_token_accuracy": 0.7430776119232178, + "num_tokens": 75266932.0, + "step": 32540 + }, + { + "epoch": 0.2984321995049051, + "learning_rate": 0.00014031539378380858, + "loss": 0.8585, + "mean_token_accuracy": 0.7432925641536713, + "num_tokens": 75290657.0, + "step": 32550 + }, + { + "epoch": 0.2985238837443843, + "learning_rate": 0.00014029705693591272, + "loss": 0.8475, + "mean_token_accuracy": 0.7460358500480652, + "num_tokens": 75314025.0, + "step": 32560 + }, + { + "epoch": 0.2986155679838636, + "learning_rate": 0.00014027872008801688, + "loss": 0.8363, + "mean_token_accuracy": 0.7493690609931946, + "num_tokens": 75336336.0, + "step": 32570 + }, + { + "epoch": 0.2987072522233428, + "learning_rate": 0.00014026038324012102, + "loss": 0.906, + "mean_token_accuracy": 0.7391089081764222, + "num_tokens": 75359158.0, + "step": 32580 + }, + { + "epoch": 0.298798936462822, + "learning_rate": 0.0001402420463922252, + "loss": 0.8353, + "mean_token_accuracy": 0.7448742389678955, + "num_tokens": 75381898.0, + "step": 32590 + }, + { + "epoch": 0.29889062070230127, + "learning_rate": 0.00014022370954432933, + "loss": 0.8596, + "mean_token_accuracy": 0.7458133399486542, + "num_tokens": 75405062.0, + "step": 32600 + }, + { + "epoch": 0.2989823049417805, + "learning_rate": 0.0001402053726964335, + "loss": 0.8442, + "mean_token_accuracy": 0.7488585948944092, + "num_tokens": 75428130.0, + "step": 32610 + }, + { + "epoch": 0.2990739891812597, + "learning_rate": 0.00014018703584853766, + "loss": 0.8337, + "mean_token_accuracy": 0.7478954017162323, + "num_tokens": 75450520.0, + "step": 32620 + }, + { + "epoch": 0.29916567342073896, + "learning_rate": 0.0001401686990006418, + "loss": 0.8863, + "mean_token_accuracy": 0.7290149629116058, + "num_tokens": 75473367.0, + "step": 32630 + }, + { + "epoch": 0.2992573576602182, + "learning_rate": 0.00014015036215274596, + "loss": 0.856, + "mean_token_accuracy": 0.7386962234973907, + "num_tokens": 75496775.0, + "step": 32640 + }, + { + "epoch": 0.29934904189969747, + "learning_rate": 0.0001401320253048501, + "loss": 0.8657, + "mean_token_accuracy": 0.7430225610733032, + "num_tokens": 75520106.0, + "step": 32650 + }, + { + "epoch": 0.29944072613917666, + "learning_rate": 0.00014011368845695424, + "loss": 0.8625, + "mean_token_accuracy": 0.7468016922473908, + "num_tokens": 75543050.0, + "step": 32660 + }, + { + "epoch": 0.2995324103786559, + "learning_rate": 0.0001400953516090584, + "loss": 0.8398, + "mean_token_accuracy": 0.7432979285717011, + "num_tokens": 75566710.0, + "step": 32670 + }, + { + "epoch": 0.29962409461813516, + "learning_rate": 0.00014007701476116257, + "loss": 0.8289, + "mean_token_accuracy": 0.7504425466060638, + "num_tokens": 75589624.0, + "step": 32680 + }, + { + "epoch": 0.29971577885761436, + "learning_rate": 0.00014005867791326673, + "loss": 0.8293, + "mean_token_accuracy": 0.747108769416809, + "num_tokens": 75612434.0, + "step": 32690 + }, + { + "epoch": 0.2998074630970936, + "learning_rate": 0.00014004034106537087, + "loss": 0.8254, + "mean_token_accuracy": 0.754813802242279, + "num_tokens": 75636279.0, + "step": 32700 + }, + { + "epoch": 0.29989914733657286, + "learning_rate": 0.000140022004217475, + "loss": 0.8211, + "mean_token_accuracy": 0.7556751549243927, + "num_tokens": 75659171.0, + "step": 32710 + }, + { + "epoch": 0.29999083157605205, + "learning_rate": 0.00014000366736957918, + "loss": 0.8486, + "mean_token_accuracy": 0.7435480654239655, + "num_tokens": 75682235.0, + "step": 32720 + }, + { + "epoch": 0.3000825158155313, + "learning_rate": 0.00013998533052168331, + "loss": 0.8572, + "mean_token_accuracy": 0.7503647685050965, + "num_tokens": 75705256.0, + "step": 32730 + }, + { + "epoch": 0.30017420005501055, + "learning_rate": 0.00013996699367378748, + "loss": 0.849, + "mean_token_accuracy": 0.7448776602745056, + "num_tokens": 75728535.0, + "step": 32740 + }, + { + "epoch": 0.3002658842944898, + "learning_rate": 0.00013994865682589165, + "loss": 0.8409, + "mean_token_accuracy": 0.7476956903934479, + "num_tokens": 75752096.0, + "step": 32750 + }, + { + "epoch": 0.300357568533969, + "learning_rate": 0.00013993031997799578, + "loss": 0.8838, + "mean_token_accuracy": 0.7399802386760712, + "num_tokens": 75774942.0, + "step": 32760 + }, + { + "epoch": 0.30044925277344825, + "learning_rate": 0.00013991198313009995, + "loss": 0.8464, + "mean_token_accuracy": 0.752990335226059, + "num_tokens": 75797111.0, + "step": 32770 + }, + { + "epoch": 0.3005409370129275, + "learning_rate": 0.0001398936462822041, + "loss": 0.8609, + "mean_token_accuracy": 0.736510944366455, + "num_tokens": 75819608.0, + "step": 32780 + }, + { + "epoch": 0.3006326212524067, + "learning_rate": 0.00013987530943430825, + "loss": 0.8671, + "mean_token_accuracy": 0.7408483803272248, + "num_tokens": 75842093.0, + "step": 32790 + }, + { + "epoch": 0.30072430549188595, + "learning_rate": 0.0001398569725864124, + "loss": 0.8363, + "mean_token_accuracy": 0.7478606402873993, + "num_tokens": 75865258.0, + "step": 32800 + }, + { + "epoch": 0.3008159897313652, + "learning_rate": 0.00013983863573851656, + "loss": 0.8739, + "mean_token_accuracy": 0.7317023873329163, + "num_tokens": 75888126.0, + "step": 32810 + }, + { + "epoch": 0.3009076739708444, + "learning_rate": 0.00013982029889062072, + "loss": 0.8636, + "mean_token_accuracy": 0.7460320651531219, + "num_tokens": 75911310.0, + "step": 32820 + }, + { + "epoch": 0.30099935821032364, + "learning_rate": 0.00013980196204272486, + "loss": 0.8217, + "mean_token_accuracy": 0.7521295309066772, + "num_tokens": 75933653.0, + "step": 32830 + }, + { + "epoch": 0.3010910424498029, + "learning_rate": 0.00013978362519482903, + "loss": 0.8238, + "mean_token_accuracy": 0.7496893882751465, + "num_tokens": 75955649.0, + "step": 32840 + }, + { + "epoch": 0.3011827266892821, + "learning_rate": 0.00013976528834693316, + "loss": 0.8675, + "mean_token_accuracy": 0.7385407745838165, + "num_tokens": 75978503.0, + "step": 32850 + }, + { + "epoch": 0.30127441092876134, + "learning_rate": 0.0001397469514990373, + "loss": 0.851, + "mean_token_accuracy": 0.7472930252552032, + "num_tokens": 76001930.0, + "step": 32860 + }, + { + "epoch": 0.3013660951682406, + "learning_rate": 0.00013972861465114147, + "loss": 0.8601, + "mean_token_accuracy": 0.7451577663421631, + "num_tokens": 76024711.0, + "step": 32870 + }, + { + "epoch": 0.30145777940771984, + "learning_rate": 0.00013971027780324563, + "loss": 0.8251, + "mean_token_accuracy": 0.7494319319725037, + "num_tokens": 76047325.0, + "step": 32880 + }, + { + "epoch": 0.30154946364719903, + "learning_rate": 0.0001396919409553498, + "loss": 0.8759, + "mean_token_accuracy": 0.7339219331741333, + "num_tokens": 76070650.0, + "step": 32890 + }, + { + "epoch": 0.3016411478866783, + "learning_rate": 0.00013967360410745394, + "loss": 0.8827, + "mean_token_accuracy": 0.7390013694763183, + "num_tokens": 76093518.0, + "step": 32900 + }, + { + "epoch": 0.30173283212615754, + "learning_rate": 0.00013965526725955808, + "loss": 0.8396, + "mean_token_accuracy": 0.7473307371139526, + "num_tokens": 76116985.0, + "step": 32910 + }, + { + "epoch": 0.30182451636563673, + "learning_rate": 0.00013963693041166224, + "loss": 0.87, + "mean_token_accuracy": 0.7436900436878204, + "num_tokens": 76140208.0, + "step": 32920 + }, + { + "epoch": 0.301916200605116, + "learning_rate": 0.00013961859356376638, + "loss": 0.85, + "mean_token_accuracy": 0.7430337429046631, + "num_tokens": 76163444.0, + "step": 32930 + }, + { + "epoch": 0.30200788484459523, + "learning_rate": 0.00013960025671587057, + "loss": 0.8636, + "mean_token_accuracy": 0.7484816789627076, + "num_tokens": 76186322.0, + "step": 32940 + }, + { + "epoch": 0.3020995690840744, + "learning_rate": 0.0001395819198679747, + "loss": 0.8329, + "mean_token_accuracy": 0.7511256515979767, + "num_tokens": 76208826.0, + "step": 32950 + }, + { + "epoch": 0.3021912533235537, + "learning_rate": 0.00013956358302007885, + "loss": 0.8322, + "mean_token_accuracy": 0.752809476852417, + "num_tokens": 76232270.0, + "step": 32960 + }, + { + "epoch": 0.3022829375630329, + "learning_rate": 0.00013954524617218301, + "loss": 0.844, + "mean_token_accuracy": 0.7424205303192138, + "num_tokens": 76255069.0, + "step": 32970 + }, + { + "epoch": 0.3023746218025121, + "learning_rate": 0.00013952690932428715, + "loss": 0.8378, + "mean_token_accuracy": 0.7539783895015717, + "num_tokens": 76278489.0, + "step": 32980 + }, + { + "epoch": 0.3024663060419914, + "learning_rate": 0.00013950857247639132, + "loss": 0.8594, + "mean_token_accuracy": 0.7450504243373871, + "num_tokens": 76300346.0, + "step": 32990 + }, + { + "epoch": 0.3025579902814706, + "learning_rate": 0.00013949023562849546, + "loss": 0.846, + "mean_token_accuracy": 0.7447242200374603, + "num_tokens": 76323112.0, + "step": 33000 + }, + { + "epoch": 0.3026496745209499, + "learning_rate": 0.00013947189878059962, + "loss": 0.8101, + "mean_token_accuracy": 0.7504319071769714, + "num_tokens": 76345720.0, + "step": 33010 + }, + { + "epoch": 0.30274135876042907, + "learning_rate": 0.0001394535619327038, + "loss": 0.859, + "mean_token_accuracy": 0.7491183936595917, + "num_tokens": 76368925.0, + "step": 33020 + }, + { + "epoch": 0.3028330429999083, + "learning_rate": 0.00013943522508480792, + "loss": 0.8243, + "mean_token_accuracy": 0.7520512044429779, + "num_tokens": 76392125.0, + "step": 33030 + }, + { + "epoch": 0.30292472723938757, + "learning_rate": 0.0001394168882369121, + "loss": 0.8565, + "mean_token_accuracy": 0.7417470753192902, + "num_tokens": 76414784.0, + "step": 33040 + }, + { + "epoch": 0.30301641147886677, + "learning_rate": 0.00013939855138901623, + "loss": 0.8523, + "mean_token_accuracy": 0.7458143174648285, + "num_tokens": 76438553.0, + "step": 33050 + }, + { + "epoch": 0.303108095718346, + "learning_rate": 0.00013938021454112037, + "loss": 0.8357, + "mean_token_accuracy": 0.7528502702713012, + "num_tokens": 76461596.0, + "step": 33060 + }, + { + "epoch": 0.30319977995782527, + "learning_rate": 0.00013936187769322456, + "loss": 0.8864, + "mean_token_accuracy": 0.7383783102035523, + "num_tokens": 76484693.0, + "step": 33070 + }, + { + "epoch": 0.30329146419730446, + "learning_rate": 0.0001393435408453287, + "loss": 0.8461, + "mean_token_accuracy": 0.7431750297546387, + "num_tokens": 76507530.0, + "step": 33080 + }, + { + "epoch": 0.3033831484367837, + "learning_rate": 0.00013932520399743286, + "loss": 0.8776, + "mean_token_accuracy": 0.738301956653595, + "num_tokens": 76529391.0, + "step": 33090 + }, + { + "epoch": 0.30347483267626296, + "learning_rate": 0.000139306867149537, + "loss": 0.8396, + "mean_token_accuracy": 0.7473569512367249, + "num_tokens": 76551653.0, + "step": 33100 + }, + { + "epoch": 0.30356651691574216, + "learning_rate": 0.00013928853030164114, + "loss": 0.8513, + "mean_token_accuracy": 0.7458438456058503, + "num_tokens": 76574931.0, + "step": 33110 + }, + { + "epoch": 0.3036582011552214, + "learning_rate": 0.0001392701934537453, + "loss": 0.8563, + "mean_token_accuracy": 0.7456990718841553, + "num_tokens": 76598160.0, + "step": 33120 + }, + { + "epoch": 0.30374988539470066, + "learning_rate": 0.00013925185660584944, + "loss": 0.8362, + "mean_token_accuracy": 0.7468683779239654, + "num_tokens": 76621926.0, + "step": 33130 + }, + { + "epoch": 0.3038415696341799, + "learning_rate": 0.00013923351975795364, + "loss": 0.8364, + "mean_token_accuracy": 0.7583596706390381, + "num_tokens": 76644602.0, + "step": 33140 + }, + { + "epoch": 0.3039332538736591, + "learning_rate": 0.00013921518291005777, + "loss": 0.839, + "mean_token_accuracy": 0.7520948767662048, + "num_tokens": 76668096.0, + "step": 33150 + }, + { + "epoch": 0.30402493811313835, + "learning_rate": 0.0001391968460621619, + "loss": 0.8453, + "mean_token_accuracy": 0.7482321858406067, + "num_tokens": 76690471.0, + "step": 33160 + }, + { + "epoch": 0.3041166223526176, + "learning_rate": 0.00013917850921426608, + "loss": 0.8555, + "mean_token_accuracy": 0.7384559750556946, + "num_tokens": 76713138.0, + "step": 33170 + }, + { + "epoch": 0.3042083065920968, + "learning_rate": 0.00013916017236637022, + "loss": 0.8736, + "mean_token_accuracy": 0.738041752576828, + "num_tokens": 76735680.0, + "step": 33180 + }, + { + "epoch": 0.30429999083157605, + "learning_rate": 0.00013914183551847438, + "loss": 0.8289, + "mean_token_accuracy": 0.7484506666660309, + "num_tokens": 76758523.0, + "step": 33190 + }, + { + "epoch": 0.3043916750710553, + "learning_rate": 0.00013912349867057855, + "loss": 0.8823, + "mean_token_accuracy": 0.7356573045253754, + "num_tokens": 76780316.0, + "step": 33200 + }, + { + "epoch": 0.3044833593105345, + "learning_rate": 0.00013910516182268269, + "loss": 0.8146, + "mean_token_accuracy": 0.749269676208496, + "num_tokens": 76803997.0, + "step": 33210 + }, + { + "epoch": 0.30457504355001375, + "learning_rate": 0.00013908682497478685, + "loss": 0.8394, + "mean_token_accuracy": 0.7488521456718444, + "num_tokens": 76826201.0, + "step": 33220 + }, + { + "epoch": 0.304666727789493, + "learning_rate": 0.000139068488126891, + "loss": 0.8409, + "mean_token_accuracy": 0.7477450549602509, + "num_tokens": 76850018.0, + "step": 33230 + }, + { + "epoch": 0.3047584120289722, + "learning_rate": 0.00013905015127899515, + "loss": 0.8543, + "mean_token_accuracy": 0.7425000071525574, + "num_tokens": 76872969.0, + "step": 33240 + }, + { + "epoch": 0.30485009626845144, + "learning_rate": 0.0001390318144310993, + "loss": 0.8581, + "mean_token_accuracy": 0.7348301351070404, + "num_tokens": 76896052.0, + "step": 33250 + }, + { + "epoch": 0.3049417805079307, + "learning_rate": 0.00013901347758320343, + "loss": 0.8316, + "mean_token_accuracy": 0.7494641184806824, + "num_tokens": 76917979.0, + "step": 33260 + }, + { + "epoch": 0.30503346474740994, + "learning_rate": 0.00013899514073530762, + "loss": 0.8406, + "mean_token_accuracy": 0.7472612977027893, + "num_tokens": 76941167.0, + "step": 33270 + }, + { + "epoch": 0.30512514898688914, + "learning_rate": 0.00013897680388741176, + "loss": 0.8588, + "mean_token_accuracy": 0.7480234622955322, + "num_tokens": 76964086.0, + "step": 33280 + }, + { + "epoch": 0.3052168332263684, + "learning_rate": 0.00013895846703951593, + "loss": 0.8368, + "mean_token_accuracy": 0.7458792328834534, + "num_tokens": 76987183.0, + "step": 33290 + }, + { + "epoch": 0.30530851746584764, + "learning_rate": 0.00013894013019162007, + "loss": 0.8663, + "mean_token_accuracy": 0.742641395330429, + "num_tokens": 77010631.0, + "step": 33300 + }, + { + "epoch": 0.30540020170532683, + "learning_rate": 0.0001389217933437242, + "loss": 0.8646, + "mean_token_accuracy": 0.7419748723506927, + "num_tokens": 77033406.0, + "step": 33310 + }, + { + "epoch": 0.3054918859448061, + "learning_rate": 0.00013890345649582837, + "loss": 0.7912, + "mean_token_accuracy": 0.760988461971283, + "num_tokens": 77056069.0, + "step": 33320 + }, + { + "epoch": 0.30558357018428534, + "learning_rate": 0.00013888511964793254, + "loss": 0.8489, + "mean_token_accuracy": 0.7463546633720398, + "num_tokens": 77079187.0, + "step": 33330 + }, + { + "epoch": 0.30567525442376453, + "learning_rate": 0.0001388667828000367, + "loss": 0.8792, + "mean_token_accuracy": 0.7405191779136657, + "num_tokens": 77101817.0, + "step": 33340 + }, + { + "epoch": 0.3057669386632438, + "learning_rate": 0.00013884844595214084, + "loss": 0.8568, + "mean_token_accuracy": 0.743732112646103, + "num_tokens": 77124917.0, + "step": 33350 + }, + { + "epoch": 0.30585862290272303, + "learning_rate": 0.00013883010910424498, + "loss": 0.8591, + "mean_token_accuracy": 0.7493031442165374, + "num_tokens": 77148323.0, + "step": 33360 + }, + { + "epoch": 0.3059503071422023, + "learning_rate": 0.00013881177225634914, + "loss": 0.828, + "mean_token_accuracy": 0.7545134902000428, + "num_tokens": 77171971.0, + "step": 33370 + }, + { + "epoch": 0.3060419913816815, + "learning_rate": 0.00013879343540845328, + "loss": 0.8334, + "mean_token_accuracy": 0.7538052439689636, + "num_tokens": 77195015.0, + "step": 33380 + }, + { + "epoch": 0.30613367562116073, + "learning_rate": 0.00013877509856055745, + "loss": 0.8962, + "mean_token_accuracy": 0.7372683942317962, + "num_tokens": 77218283.0, + "step": 33390 + }, + { + "epoch": 0.30622535986064, + "learning_rate": 0.0001387567617126616, + "loss": 0.8271, + "mean_token_accuracy": 0.7487876236438751, + "num_tokens": 77241440.0, + "step": 33400 + }, + { + "epoch": 0.3063170441001192, + "learning_rate": 0.00013873842486476575, + "loss": 0.8656, + "mean_token_accuracy": 0.7421483814716339, + "num_tokens": 77264426.0, + "step": 33410 + }, + { + "epoch": 0.3064087283395984, + "learning_rate": 0.00013872008801686992, + "loss": 0.8591, + "mean_token_accuracy": 0.7459542334079743, + "num_tokens": 77287335.0, + "step": 33420 + }, + { + "epoch": 0.3065004125790777, + "learning_rate": 0.00013870175116897405, + "loss": 0.8505, + "mean_token_accuracy": 0.7433769702911377, + "num_tokens": 77310740.0, + "step": 33430 + }, + { + "epoch": 0.30659209681855687, + "learning_rate": 0.00013868341432107822, + "loss": 0.8397, + "mean_token_accuracy": 0.7411685645580292, + "num_tokens": 77333516.0, + "step": 33440 + }, + { + "epoch": 0.3066837810580361, + "learning_rate": 0.00013866507747318236, + "loss": 0.8347, + "mean_token_accuracy": 0.7427520096302033, + "num_tokens": 77356228.0, + "step": 33450 + }, + { + "epoch": 0.30677546529751537, + "learning_rate": 0.00013864674062528652, + "loss": 0.8709, + "mean_token_accuracy": 0.7422504723072052, + "num_tokens": 77379003.0, + "step": 33460 + }, + { + "epoch": 0.30686714953699457, + "learning_rate": 0.0001386284037773907, + "loss": 0.8177, + "mean_token_accuracy": 0.7486840307712554, + "num_tokens": 77402464.0, + "step": 33470 + }, + { + "epoch": 0.3069588337764738, + "learning_rate": 0.00013861006692949483, + "loss": 0.8475, + "mean_token_accuracy": 0.7467386662960053, + "num_tokens": 77425347.0, + "step": 33480 + }, + { + "epoch": 0.30705051801595307, + "learning_rate": 0.000138591730081599, + "loss": 0.829, + "mean_token_accuracy": 0.7501772046089172, + "num_tokens": 77447614.0, + "step": 33490 + }, + { + "epoch": 0.3071422022554323, + "learning_rate": 0.00013857339323370313, + "loss": 0.8269, + "mean_token_accuracy": 0.7498204708099365, + "num_tokens": 77471207.0, + "step": 33500 + }, + { + "epoch": 0.3072338864949115, + "learning_rate": 0.00013855505638580727, + "loss": 0.841, + "mean_token_accuracy": 0.7512203574180603, + "num_tokens": 77494344.0, + "step": 33510 + }, + { + "epoch": 0.30732557073439076, + "learning_rate": 0.00013853671953791143, + "loss": 0.8561, + "mean_token_accuracy": 0.7417186796665192, + "num_tokens": 77516961.0, + "step": 33520 + }, + { + "epoch": 0.30741725497387, + "learning_rate": 0.0001385183826900156, + "loss": 0.8404, + "mean_token_accuracy": 0.7555020093917847, + "num_tokens": 77539976.0, + "step": 33530 + }, + { + "epoch": 0.3075089392133492, + "learning_rate": 0.00013850004584211976, + "loss": 0.85, + "mean_token_accuracy": 0.7431936383247375, + "num_tokens": 77563528.0, + "step": 33540 + }, + { + "epoch": 0.30760062345282846, + "learning_rate": 0.0001384817089942239, + "loss": 0.8348, + "mean_token_accuracy": 0.7480647802352905, + "num_tokens": 77586766.0, + "step": 33550 + }, + { + "epoch": 0.3076923076923077, + "learning_rate": 0.00013846337214632804, + "loss": 0.8024, + "mean_token_accuracy": 0.7537217140197754, + "num_tokens": 77609032.0, + "step": 33560 + }, + { + "epoch": 0.3077839919317869, + "learning_rate": 0.0001384450352984322, + "loss": 0.8445, + "mean_token_accuracy": 0.7477411210536957, + "num_tokens": 77632016.0, + "step": 33570 + }, + { + "epoch": 0.30787567617126615, + "learning_rate": 0.00013842669845053635, + "loss": 0.906, + "mean_token_accuracy": 0.7402415156364441, + "num_tokens": 77654913.0, + "step": 33580 + }, + { + "epoch": 0.3079673604107454, + "learning_rate": 0.0001384083616026405, + "loss": 0.8686, + "mean_token_accuracy": 0.7412020742893219, + "num_tokens": 77677818.0, + "step": 33590 + }, + { + "epoch": 0.3080590446502246, + "learning_rate": 0.00013839002475474468, + "loss": 0.8731, + "mean_token_accuracy": 0.7371971726417541, + "num_tokens": 77701930.0, + "step": 33600 + }, + { + "epoch": 0.30815072888970385, + "learning_rate": 0.00013837168790684881, + "loss": 0.844, + "mean_token_accuracy": 0.7502223968505859, + "num_tokens": 77724335.0, + "step": 33610 + }, + { + "epoch": 0.3082424131291831, + "learning_rate": 0.00013835335105895298, + "loss": 0.8432, + "mean_token_accuracy": 0.7439646542072296, + "num_tokens": 77747638.0, + "step": 33620 + }, + { + "epoch": 0.30833409736866235, + "learning_rate": 0.00013833501421105712, + "loss": 0.8704, + "mean_token_accuracy": 0.7407457113265992, + "num_tokens": 77770369.0, + "step": 33630 + }, + { + "epoch": 0.30842578160814155, + "learning_rate": 0.00013831667736316128, + "loss": 0.7746, + "mean_token_accuracy": 0.7646201491355896, + "num_tokens": 77793521.0, + "step": 33640 + }, + { + "epoch": 0.3085174658476208, + "learning_rate": 0.00013829834051526542, + "loss": 0.8796, + "mean_token_accuracy": 0.7416764795780182, + "num_tokens": 77816667.0, + "step": 33650 + }, + { + "epoch": 0.30860915008710005, + "learning_rate": 0.0001382800036673696, + "loss": 0.8788, + "mean_token_accuracy": 0.7355660200119019, + "num_tokens": 77840037.0, + "step": 33660 + }, + { + "epoch": 0.30870083432657924, + "learning_rate": 0.00013826166681947375, + "loss": 0.8006, + "mean_token_accuracy": 0.7525620520114898, + "num_tokens": 77862699.0, + "step": 33670 + }, + { + "epoch": 0.3087925185660585, + "learning_rate": 0.0001382433299715779, + "loss": 0.8562, + "mean_token_accuracy": 0.7428406774997711, + "num_tokens": 77885136.0, + "step": 33680 + }, + { + "epoch": 0.30888420280553774, + "learning_rate": 0.00013822499312368206, + "loss": 0.8449, + "mean_token_accuracy": 0.739268159866333, + "num_tokens": 77907679.0, + "step": 33690 + }, + { + "epoch": 0.30897588704501694, + "learning_rate": 0.0001382066562757862, + "loss": 0.8431, + "mean_token_accuracy": 0.7458111703395843, + "num_tokens": 77930616.0, + "step": 33700 + }, + { + "epoch": 0.3090675712844962, + "learning_rate": 0.00013818831942789033, + "loss": 0.8485, + "mean_token_accuracy": 0.7450494110584259, + "num_tokens": 77953639.0, + "step": 33710 + }, + { + "epoch": 0.30915925552397544, + "learning_rate": 0.0001381699825799945, + "loss": 0.8643, + "mean_token_accuracy": 0.7464971423149109, + "num_tokens": 77976914.0, + "step": 33720 + }, + { + "epoch": 0.30925093976345464, + "learning_rate": 0.00013815164573209866, + "loss": 0.8645, + "mean_token_accuracy": 0.7457862615585327, + "num_tokens": 77999509.0, + "step": 33730 + }, + { + "epoch": 0.3093426240029339, + "learning_rate": 0.00013813330888420283, + "loss": 0.8424, + "mean_token_accuracy": 0.7435806334018707, + "num_tokens": 78023950.0, + "step": 33740 + }, + { + "epoch": 0.30943430824241314, + "learning_rate": 0.00013811497203630697, + "loss": 0.8658, + "mean_token_accuracy": 0.7419386982917786, + "num_tokens": 78047833.0, + "step": 33750 + }, + { + "epoch": 0.3095259924818924, + "learning_rate": 0.0001380966351884111, + "loss": 0.8387, + "mean_token_accuracy": 0.7498943448066712, + "num_tokens": 78070834.0, + "step": 33760 + }, + { + "epoch": 0.3096176767213716, + "learning_rate": 0.00013807829834051527, + "loss": 0.8471, + "mean_token_accuracy": 0.7432628989219665, + "num_tokens": 78093543.0, + "step": 33770 + }, + { + "epoch": 0.30970936096085083, + "learning_rate": 0.0001380599614926194, + "loss": 0.8613, + "mean_token_accuracy": 0.7407761573791504, + "num_tokens": 78116708.0, + "step": 33780 + }, + { + "epoch": 0.3098010452003301, + "learning_rate": 0.00013804162464472358, + "loss": 0.8765, + "mean_token_accuracy": 0.7389798283576965, + "num_tokens": 78140055.0, + "step": 33790 + }, + { + "epoch": 0.3098927294398093, + "learning_rate": 0.00013802328779682774, + "loss": 0.8564, + "mean_token_accuracy": 0.750953084230423, + "num_tokens": 78163584.0, + "step": 33800 + }, + { + "epoch": 0.30998441367928853, + "learning_rate": 0.00013800495094893188, + "loss": 0.8509, + "mean_token_accuracy": 0.7473524689674378, + "num_tokens": 78186526.0, + "step": 33810 + }, + { + "epoch": 0.3100760979187678, + "learning_rate": 0.00013798661410103604, + "loss": 0.8337, + "mean_token_accuracy": 0.7452644348144531, + "num_tokens": 78209865.0, + "step": 33820 + }, + { + "epoch": 0.310167782158247, + "learning_rate": 0.00013796827725314018, + "loss": 0.8362, + "mean_token_accuracy": 0.7420852065086365, + "num_tokens": 78232857.0, + "step": 33830 + }, + { + "epoch": 0.3102594663977262, + "learning_rate": 0.00013794994040524435, + "loss": 0.8561, + "mean_token_accuracy": 0.7465553224086762, + "num_tokens": 78256639.0, + "step": 33840 + }, + { + "epoch": 0.3103511506372055, + "learning_rate": 0.00013793160355734849, + "loss": 0.8656, + "mean_token_accuracy": 0.7351106941699982, + "num_tokens": 78279723.0, + "step": 33850 + }, + { + "epoch": 0.3104428348766847, + "learning_rate": 0.00013791326670945265, + "loss": 0.8627, + "mean_token_accuracy": 0.7368688642978668, + "num_tokens": 78302587.0, + "step": 33860 + }, + { + "epoch": 0.3105345191161639, + "learning_rate": 0.00013789492986155682, + "loss": 0.8728, + "mean_token_accuracy": 0.7496148109436035, + "num_tokens": 78325276.0, + "step": 33870 + }, + { + "epoch": 0.31062620335564317, + "learning_rate": 0.00013787659301366096, + "loss": 0.8181, + "mean_token_accuracy": 0.7458925127983094, + "num_tokens": 78348670.0, + "step": 33880 + }, + { + "epoch": 0.3107178875951224, + "learning_rate": 0.00013785825616576512, + "loss": 0.8495, + "mean_token_accuracy": 0.7495343565940857, + "num_tokens": 78371576.0, + "step": 33890 + }, + { + "epoch": 0.3108095718346016, + "learning_rate": 0.00013783991931786926, + "loss": 0.872, + "mean_token_accuracy": 0.7415913641452789, + "num_tokens": 78394561.0, + "step": 33900 + }, + { + "epoch": 0.31090125607408087, + "learning_rate": 0.0001378215824699734, + "loss": 0.8622, + "mean_token_accuracy": 0.7382225751876831, + "num_tokens": 78417398.0, + "step": 33910 + }, + { + "epoch": 0.3109929403135601, + "learning_rate": 0.0001378032456220776, + "loss": 0.8453, + "mean_token_accuracy": 0.7446352064609527, + "num_tokens": 78439842.0, + "step": 33920 + }, + { + "epoch": 0.3110846245530393, + "learning_rate": 0.00013778490877418173, + "loss": 0.8918, + "mean_token_accuracy": 0.7458747148513794, + "num_tokens": 78462547.0, + "step": 33930 + }, + { + "epoch": 0.31117630879251856, + "learning_rate": 0.0001377665719262859, + "loss": 0.8929, + "mean_token_accuracy": 0.7326566874980927, + "num_tokens": 78485928.0, + "step": 33940 + }, + { + "epoch": 0.3112679930319978, + "learning_rate": 0.00013774823507839003, + "loss": 0.8453, + "mean_token_accuracy": 0.7494336009025574, + "num_tokens": 78508363.0, + "step": 33950 + }, + { + "epoch": 0.311359677271477, + "learning_rate": 0.00013772989823049417, + "loss": 0.8582, + "mean_token_accuracy": 0.7438672244548797, + "num_tokens": 78531327.0, + "step": 33960 + }, + { + "epoch": 0.31145136151095626, + "learning_rate": 0.00013771156138259834, + "loss": 0.8786, + "mean_token_accuracy": 0.7443876504898072, + "num_tokens": 78555046.0, + "step": 33970 + }, + { + "epoch": 0.3115430457504355, + "learning_rate": 0.00013769322453470247, + "loss": 0.8256, + "mean_token_accuracy": 0.7507291913032532, + "num_tokens": 78577902.0, + "step": 33980 + }, + { + "epoch": 0.31163472998991476, + "learning_rate": 0.00013767488768680664, + "loss": 0.8639, + "mean_token_accuracy": 0.7446135640144348, + "num_tokens": 78600485.0, + "step": 33990 + }, + { + "epoch": 0.31172641422939396, + "learning_rate": 0.0001376565508389108, + "loss": 0.871, + "mean_token_accuracy": 0.7453547239303588, + "num_tokens": 78622655.0, + "step": 34000 + }, + { + "epoch": 0.3118180984688732, + "learning_rate": 0.00013763821399101494, + "loss": 0.8801, + "mean_token_accuracy": 0.7399561107158661, + "num_tokens": 78646145.0, + "step": 34010 + }, + { + "epoch": 0.31190978270835246, + "learning_rate": 0.0001376198771431191, + "loss": 0.8625, + "mean_token_accuracy": 0.7371825695037841, + "num_tokens": 78669868.0, + "step": 34020 + }, + { + "epoch": 0.31200146694783165, + "learning_rate": 0.00013760154029522325, + "loss": 0.8354, + "mean_token_accuracy": 0.7505948424339295, + "num_tokens": 78692541.0, + "step": 34030 + }, + { + "epoch": 0.3120931511873109, + "learning_rate": 0.0001375832034473274, + "loss": 0.8324, + "mean_token_accuracy": 0.7473336160182953, + "num_tokens": 78715340.0, + "step": 34040 + }, + { + "epoch": 0.31218483542679015, + "learning_rate": 0.00013756486659943158, + "loss": 0.8658, + "mean_token_accuracy": 0.7392273724079133, + "num_tokens": 78737797.0, + "step": 34050 + }, + { + "epoch": 0.31227651966626935, + "learning_rate": 0.00013754652975153572, + "loss": 0.8339, + "mean_token_accuracy": 0.7455706655979156, + "num_tokens": 78760741.0, + "step": 34060 + }, + { + "epoch": 0.3123682039057486, + "learning_rate": 0.00013752819290363988, + "loss": 0.8897, + "mean_token_accuracy": 0.7384982705116272, + "num_tokens": 78785235.0, + "step": 34070 + }, + { + "epoch": 0.31245988814522785, + "learning_rate": 0.00013750985605574402, + "loss": 0.8657, + "mean_token_accuracy": 0.7436144709587097, + "num_tokens": 78808390.0, + "step": 34080 + }, + { + "epoch": 0.31255157238470704, + "learning_rate": 0.00013749151920784819, + "loss": 0.8453, + "mean_token_accuracy": 0.742193204164505, + "num_tokens": 78831392.0, + "step": 34090 + }, + { + "epoch": 0.3126432566241863, + "learning_rate": 0.00013747318235995232, + "loss": 0.8323, + "mean_token_accuracy": 0.741822338104248, + "num_tokens": 78854868.0, + "step": 34100 + }, + { + "epoch": 0.31273494086366554, + "learning_rate": 0.00013745484551205646, + "loss": 0.7973, + "mean_token_accuracy": 0.7539364516735076, + "num_tokens": 78877421.0, + "step": 34110 + }, + { + "epoch": 0.3128266251031448, + "learning_rate": 0.00013743650866416065, + "loss": 0.8239, + "mean_token_accuracy": 0.7552946329116821, + "num_tokens": 78901198.0, + "step": 34120 + }, + { + "epoch": 0.312918309342624, + "learning_rate": 0.0001374181718162648, + "loss": 0.8978, + "mean_token_accuracy": 0.7341907978057861, + "num_tokens": 78923534.0, + "step": 34130 + }, + { + "epoch": 0.31300999358210324, + "learning_rate": 0.00013739983496836896, + "loss": 0.8733, + "mean_token_accuracy": 0.7404236376285553, + "num_tokens": 78946443.0, + "step": 34140 + }, + { + "epoch": 0.3131016778215825, + "learning_rate": 0.0001373814981204731, + "loss": 0.8332, + "mean_token_accuracy": 0.7449717223644257, + "num_tokens": 78970146.0, + "step": 34150 + }, + { + "epoch": 0.3131933620610617, + "learning_rate": 0.00013736316127257723, + "loss": 0.8517, + "mean_token_accuracy": 0.7426335871219635, + "num_tokens": 78992758.0, + "step": 34160 + }, + { + "epoch": 0.31328504630054094, + "learning_rate": 0.0001373448244246814, + "loss": 0.8367, + "mean_token_accuracy": 0.750715833902359, + "num_tokens": 79015249.0, + "step": 34170 + }, + { + "epoch": 0.3133767305400202, + "learning_rate": 0.00013732648757678557, + "loss": 0.8978, + "mean_token_accuracy": 0.7321100652217865, + "num_tokens": 79037518.0, + "step": 34180 + }, + { + "epoch": 0.3134684147794994, + "learning_rate": 0.0001373081507288897, + "loss": 0.8428, + "mean_token_accuracy": 0.7446274638175965, + "num_tokens": 79060436.0, + "step": 34190 + }, + { + "epoch": 0.31356009901897863, + "learning_rate": 0.00013728981388099387, + "loss": 0.8593, + "mean_token_accuracy": 0.743911737203598, + "num_tokens": 79083372.0, + "step": 34200 + }, + { + "epoch": 0.3136517832584579, + "learning_rate": 0.000137271477033098, + "loss": 0.8306, + "mean_token_accuracy": 0.7476195931434632, + "num_tokens": 79106779.0, + "step": 34210 + }, + { + "epoch": 0.3137434674979371, + "learning_rate": 0.00013725314018520217, + "loss": 0.8751, + "mean_token_accuracy": 0.7391022264957428, + "num_tokens": 79129618.0, + "step": 34220 + }, + { + "epoch": 0.31383515173741633, + "learning_rate": 0.0001372348033373063, + "loss": 0.8712, + "mean_token_accuracy": 0.7366578221321106, + "num_tokens": 79152007.0, + "step": 34230 + }, + { + "epoch": 0.3139268359768956, + "learning_rate": 0.00013721646648941048, + "loss": 0.7959, + "mean_token_accuracy": 0.7588099181652069, + "num_tokens": 79175125.0, + "step": 34240 + }, + { + "epoch": 0.31401852021637483, + "learning_rate": 0.00013719812964151464, + "loss": 0.8432, + "mean_token_accuracy": 0.7426735818386078, + "num_tokens": 79198722.0, + "step": 34250 + }, + { + "epoch": 0.314110204455854, + "learning_rate": 0.00013717979279361878, + "loss": 0.8843, + "mean_token_accuracy": 0.734452360868454, + "num_tokens": 79221976.0, + "step": 34260 + }, + { + "epoch": 0.3142018886953333, + "learning_rate": 0.00013716145594572295, + "loss": 0.8364, + "mean_token_accuracy": 0.7462021052837372, + "num_tokens": 79245526.0, + "step": 34270 + }, + { + "epoch": 0.3142935729348125, + "learning_rate": 0.00013714311909782708, + "loss": 0.8156, + "mean_token_accuracy": 0.7524182617664337, + "num_tokens": 79268613.0, + "step": 34280 + }, + { + "epoch": 0.3143852571742917, + "learning_rate": 0.00013712478224993125, + "loss": 0.8682, + "mean_token_accuracy": 0.7409781634807586, + "num_tokens": 79291659.0, + "step": 34290 + }, + { + "epoch": 0.31447694141377097, + "learning_rate": 0.0001371064454020354, + "loss": 0.8433, + "mean_token_accuracy": 0.7476778864860535, + "num_tokens": 79315501.0, + "step": 34300 + }, + { + "epoch": 0.3145686256532502, + "learning_rate": 0.00013708810855413955, + "loss": 0.86, + "mean_token_accuracy": 0.7427622258663178, + "num_tokens": 79338230.0, + "step": 34310 + }, + { + "epoch": 0.3146603098927294, + "learning_rate": 0.00013706977170624372, + "loss": 0.8422, + "mean_token_accuracy": 0.7434896886348724, + "num_tokens": 79361510.0, + "step": 34320 + }, + { + "epoch": 0.31475199413220867, + "learning_rate": 0.00013705143485834786, + "loss": 0.8829, + "mean_token_accuracy": 0.7420975625514984, + "num_tokens": 79384636.0, + "step": 34330 + }, + { + "epoch": 0.3148436783716879, + "learning_rate": 0.00013703309801045202, + "loss": 0.8748, + "mean_token_accuracy": 0.739655327796936, + "num_tokens": 79407919.0, + "step": 34340 + }, + { + "epoch": 0.3149353626111671, + "learning_rate": 0.00013701476116255616, + "loss": 0.8858, + "mean_token_accuracy": 0.7402777910232544, + "num_tokens": 79430699.0, + "step": 34350 + }, + { + "epoch": 0.31502704685064636, + "learning_rate": 0.0001369964243146603, + "loss": 0.8899, + "mean_token_accuracy": 0.736571878194809, + "num_tokens": 79453750.0, + "step": 34360 + }, + { + "epoch": 0.3151187310901256, + "learning_rate": 0.00013697808746676446, + "loss": 0.8438, + "mean_token_accuracy": 0.7471187770366668, + "num_tokens": 79476905.0, + "step": 34370 + }, + { + "epoch": 0.31521041532960486, + "learning_rate": 0.00013695975061886863, + "loss": 0.812, + "mean_token_accuracy": 0.7540494322776794, + "num_tokens": 79499697.0, + "step": 34380 + }, + { + "epoch": 0.31530209956908406, + "learning_rate": 0.00013694141377097277, + "loss": 0.8571, + "mean_token_accuracy": 0.7447143197059631, + "num_tokens": 79523491.0, + "step": 34390 + }, + { + "epoch": 0.3153937838085633, + "learning_rate": 0.00013692307692307693, + "loss": 0.8662, + "mean_token_accuracy": 0.7435140669345855, + "num_tokens": 79546953.0, + "step": 34400 + }, + { + "epoch": 0.31548546804804256, + "learning_rate": 0.00013690474007518107, + "loss": 0.85, + "mean_token_accuracy": 0.7524021387100219, + "num_tokens": 79569717.0, + "step": 34410 + }, + { + "epoch": 0.31557715228752176, + "learning_rate": 0.00013688640322728524, + "loss": 0.8186, + "mean_token_accuracy": 0.7480797469615936, + "num_tokens": 79593407.0, + "step": 34420 + }, + { + "epoch": 0.315668836527001, + "learning_rate": 0.00013686806637938938, + "loss": 0.8711, + "mean_token_accuracy": 0.7463244736194611, + "num_tokens": 79616375.0, + "step": 34430 + }, + { + "epoch": 0.31576052076648026, + "learning_rate": 0.00013684972953149354, + "loss": 0.8918, + "mean_token_accuracy": 0.7361148715019226, + "num_tokens": 79639236.0, + "step": 34440 + }, + { + "epoch": 0.31585220500595945, + "learning_rate": 0.0001368313926835977, + "loss": 0.8359, + "mean_token_accuracy": 0.7510080814361573, + "num_tokens": 79663088.0, + "step": 34450 + }, + { + "epoch": 0.3159438892454387, + "learning_rate": 0.00013681305583570185, + "loss": 0.8547, + "mean_token_accuracy": 0.7443218410015107, + "num_tokens": 79686905.0, + "step": 34460 + }, + { + "epoch": 0.31603557348491795, + "learning_rate": 0.000136794718987806, + "loss": 0.856, + "mean_token_accuracy": 0.7426484644412994, + "num_tokens": 79709982.0, + "step": 34470 + }, + { + "epoch": 0.3161272577243972, + "learning_rate": 0.00013677638213991015, + "loss": 0.8664, + "mean_token_accuracy": 0.7364355206489563, + "num_tokens": 79732331.0, + "step": 34480 + }, + { + "epoch": 0.3162189419638764, + "learning_rate": 0.00013675804529201431, + "loss": 0.8169, + "mean_token_accuracy": 0.7513714134693146, + "num_tokens": 79755980.0, + "step": 34490 + }, + { + "epoch": 0.31631062620335565, + "learning_rate": 0.00013673970844411845, + "loss": 0.7929, + "mean_token_accuracy": 0.7554454922676086, + "num_tokens": 79779575.0, + "step": 34500 + }, + { + "epoch": 0.3164023104428349, + "learning_rate": 0.00013672137159622262, + "loss": 0.8262, + "mean_token_accuracy": 0.7452967226505279, + "num_tokens": 79803051.0, + "step": 34510 + }, + { + "epoch": 0.3164939946823141, + "learning_rate": 0.00013670303474832678, + "loss": 0.7819, + "mean_token_accuracy": 0.7652263939380646, + "num_tokens": 79825345.0, + "step": 34520 + }, + { + "epoch": 0.31658567892179335, + "learning_rate": 0.00013668469790043092, + "loss": 0.8494, + "mean_token_accuracy": 0.7425295948982239, + "num_tokens": 79848108.0, + "step": 34530 + }, + { + "epoch": 0.3166773631612726, + "learning_rate": 0.0001366663610525351, + "loss": 0.8818, + "mean_token_accuracy": 0.7419913232326507, + "num_tokens": 79871056.0, + "step": 34540 + }, + { + "epoch": 0.3167690474007518, + "learning_rate": 0.00013664802420463923, + "loss": 0.8669, + "mean_token_accuracy": 0.7456808865070343, + "num_tokens": 79894582.0, + "step": 34550 + }, + { + "epoch": 0.31686073164023104, + "learning_rate": 0.00013662968735674336, + "loss": 0.8165, + "mean_token_accuracy": 0.7550671517848968, + "num_tokens": 79917591.0, + "step": 34560 + }, + { + "epoch": 0.3169524158797103, + "learning_rate": 0.00013661135050884756, + "loss": 0.8877, + "mean_token_accuracy": 0.7403483629226685, + "num_tokens": 79940644.0, + "step": 34570 + }, + { + "epoch": 0.3170441001191895, + "learning_rate": 0.0001365930136609517, + "loss": 0.8556, + "mean_token_accuracy": 0.7453246176242828, + "num_tokens": 79964170.0, + "step": 34580 + }, + { + "epoch": 0.31713578435866874, + "learning_rate": 0.00013657467681305583, + "loss": 0.8926, + "mean_token_accuracy": 0.7324411630630493, + "num_tokens": 79987016.0, + "step": 34590 + }, + { + "epoch": 0.317227468598148, + "learning_rate": 0.00013655633996516, + "loss": 0.8397, + "mean_token_accuracy": 0.7431699335575104, + "num_tokens": 80010734.0, + "step": 34600 + }, + { + "epoch": 0.31731915283762724, + "learning_rate": 0.00013653800311726414, + "loss": 0.8842, + "mean_token_accuracy": 0.7378191828727723, + "num_tokens": 80033339.0, + "step": 34610 + }, + { + "epoch": 0.31741083707710643, + "learning_rate": 0.0001365196662693683, + "loss": 0.8356, + "mean_token_accuracy": 0.7426839649677277, + "num_tokens": 80056594.0, + "step": 34620 + }, + { + "epoch": 0.3175025213165857, + "learning_rate": 0.00013650132942147244, + "loss": 0.844, + "mean_token_accuracy": 0.7452988803386689, + "num_tokens": 80079577.0, + "step": 34630 + }, + { + "epoch": 0.31759420555606493, + "learning_rate": 0.0001364829925735766, + "loss": 0.8824, + "mean_token_accuracy": 0.7362828552722931, + "num_tokens": 80102624.0, + "step": 34640 + }, + { + "epoch": 0.31768588979554413, + "learning_rate": 0.00013646465572568077, + "loss": 0.8498, + "mean_token_accuracy": 0.7441802263259888, + "num_tokens": 80125360.0, + "step": 34650 + }, + { + "epoch": 0.3177775740350234, + "learning_rate": 0.0001364463188777849, + "loss": 0.8345, + "mean_token_accuracy": 0.7502237677574157, + "num_tokens": 80148354.0, + "step": 34660 + }, + { + "epoch": 0.31786925827450263, + "learning_rate": 0.00013642798202988908, + "loss": 0.8152, + "mean_token_accuracy": 0.755932092666626, + "num_tokens": 80171617.0, + "step": 34670 + }, + { + "epoch": 0.3179609425139818, + "learning_rate": 0.0001364096451819932, + "loss": 0.8789, + "mean_token_accuracy": 0.7385014951229095, + "num_tokens": 80194206.0, + "step": 34680 + }, + { + "epoch": 0.3180526267534611, + "learning_rate": 0.00013639130833409738, + "loss": 0.833, + "mean_token_accuracy": 0.7461274921894073, + "num_tokens": 80217109.0, + "step": 34690 + }, + { + "epoch": 0.3181443109929403, + "learning_rate": 0.00013637297148620154, + "loss": 0.8276, + "mean_token_accuracy": 0.7556744992733002, + "num_tokens": 80241261.0, + "step": 34700 + }, + { + "epoch": 0.3182359952324195, + "learning_rate": 0.00013635463463830568, + "loss": 0.8475, + "mean_token_accuracy": 0.744313532114029, + "num_tokens": 80263934.0, + "step": 34710 + }, + { + "epoch": 0.3183276794718988, + "learning_rate": 0.00013633629779040985, + "loss": 0.8051, + "mean_token_accuracy": 0.7545833706855773, + "num_tokens": 80286978.0, + "step": 34720 + }, + { + "epoch": 0.318419363711378, + "learning_rate": 0.00013631796094251399, + "loss": 0.8466, + "mean_token_accuracy": 0.7389474272727966, + "num_tokens": 80309883.0, + "step": 34730 + }, + { + "epoch": 0.3185110479508573, + "learning_rate": 0.00013629962409461815, + "loss": 0.8129, + "mean_token_accuracy": 0.7531138718128204, + "num_tokens": 80333232.0, + "step": 34740 + }, + { + "epoch": 0.31860273219033647, + "learning_rate": 0.0001362812872467223, + "loss": 0.8768, + "mean_token_accuracy": 0.7434490025043488, + "num_tokens": 80356688.0, + "step": 34750 + }, + { + "epoch": 0.3186944164298157, + "learning_rate": 0.00013626295039882643, + "loss": 0.8695, + "mean_token_accuracy": 0.745382410287857, + "num_tokens": 80380400.0, + "step": 34760 + }, + { + "epoch": 0.31878610066929497, + "learning_rate": 0.00013624461355093062, + "loss": 0.8694, + "mean_token_accuracy": 0.7431151747703553, + "num_tokens": 80403509.0, + "step": 34770 + }, + { + "epoch": 0.31887778490877416, + "learning_rate": 0.00013622627670303476, + "loss": 0.8542, + "mean_token_accuracy": 0.744390344619751, + "num_tokens": 80426896.0, + "step": 34780 + }, + { + "epoch": 0.3189694691482534, + "learning_rate": 0.0001362079398551389, + "loss": 0.8722, + "mean_token_accuracy": 0.7442276298999786, + "num_tokens": 80448749.0, + "step": 34790 + }, + { + "epoch": 0.31906115338773267, + "learning_rate": 0.00013618960300724306, + "loss": 0.8527, + "mean_token_accuracy": 0.7401118993759155, + "num_tokens": 80472387.0, + "step": 34800 + }, + { + "epoch": 0.31915283762721186, + "learning_rate": 0.0001361712661593472, + "loss": 0.853, + "mean_token_accuracy": 0.7415448069572449, + "num_tokens": 80495804.0, + "step": 34810 + }, + { + "epoch": 0.3192445218666911, + "learning_rate": 0.00013615292931145137, + "loss": 0.884, + "mean_token_accuracy": 0.7414491415023804, + "num_tokens": 80518247.0, + "step": 34820 + }, + { + "epoch": 0.31933620610617036, + "learning_rate": 0.0001361345924635555, + "loss": 0.8345, + "mean_token_accuracy": 0.7462976157665253, + "num_tokens": 80540939.0, + "step": 34830 + }, + { + "epoch": 0.31942789034564956, + "learning_rate": 0.00013611625561565967, + "loss": 0.8488, + "mean_token_accuracy": 0.7435784935951233, + "num_tokens": 80563840.0, + "step": 34840 + }, + { + "epoch": 0.3195195745851288, + "learning_rate": 0.00013609791876776384, + "loss": 0.8363, + "mean_token_accuracy": 0.7504896581172943, + "num_tokens": 80586742.0, + "step": 34850 + }, + { + "epoch": 0.31961125882460806, + "learning_rate": 0.00013607958191986797, + "loss": 0.8243, + "mean_token_accuracy": 0.7462678611278534, + "num_tokens": 80609657.0, + "step": 34860 + }, + { + "epoch": 0.3197029430640873, + "learning_rate": 0.00013606124507197214, + "loss": 0.8625, + "mean_token_accuracy": 0.7398136258125305, + "num_tokens": 80632678.0, + "step": 34870 + }, + { + "epoch": 0.3197946273035665, + "learning_rate": 0.00013604290822407628, + "loss": 0.8364, + "mean_token_accuracy": 0.7386039614677429, + "num_tokens": 80655452.0, + "step": 34880 + }, + { + "epoch": 0.31988631154304575, + "learning_rate": 0.00013602457137618044, + "loss": 0.837, + "mean_token_accuracy": 0.7428508758544922, + "num_tokens": 80678008.0, + "step": 34890 + }, + { + "epoch": 0.319977995782525, + "learning_rate": 0.0001360062345282846, + "loss": 0.8642, + "mean_token_accuracy": 0.7445224344730377, + "num_tokens": 80701095.0, + "step": 34900 + }, + { + "epoch": 0.3200696800220042, + "learning_rate": 0.00013598789768038875, + "loss": 0.8355, + "mean_token_accuracy": 0.751128089427948, + "num_tokens": 80723753.0, + "step": 34910 + }, + { + "epoch": 0.32016136426148345, + "learning_rate": 0.0001359695608324929, + "loss": 0.8031, + "mean_token_accuracy": 0.760913074016571, + "num_tokens": 80746750.0, + "step": 34920 + }, + { + "epoch": 0.3202530485009627, + "learning_rate": 0.00013595122398459705, + "loss": 0.8555, + "mean_token_accuracy": 0.7404983341693878, + "num_tokens": 80770039.0, + "step": 34930 + }, + { + "epoch": 0.3203447327404419, + "learning_rate": 0.00013593288713670122, + "loss": 0.865, + "mean_token_accuracy": 0.7448597013950348, + "num_tokens": 80793367.0, + "step": 34940 + }, + { + "epoch": 0.32043641697992115, + "learning_rate": 0.00013591455028880535, + "loss": 0.8405, + "mean_token_accuracy": 0.7469914615154266, + "num_tokens": 80815752.0, + "step": 34950 + }, + { + "epoch": 0.3205281012194004, + "learning_rate": 0.0001358962134409095, + "loss": 0.8223, + "mean_token_accuracy": 0.750765734910965, + "num_tokens": 80838887.0, + "step": 34960 + }, + { + "epoch": 0.3206197854588796, + "learning_rate": 0.00013587787659301369, + "loss": 0.8391, + "mean_token_accuracy": 0.7528128325939178, + "num_tokens": 80862533.0, + "step": 34970 + }, + { + "epoch": 0.32071146969835884, + "learning_rate": 0.00013585953974511782, + "loss": 0.8555, + "mean_token_accuracy": 0.7497487127780914, + "num_tokens": 80886573.0, + "step": 34980 + }, + { + "epoch": 0.3208031539378381, + "learning_rate": 0.00013584120289722196, + "loss": 0.8568, + "mean_token_accuracy": 0.7458373665809631, + "num_tokens": 80909588.0, + "step": 34990 + }, + { + "epoch": 0.32089483817731734, + "learning_rate": 0.00013582286604932613, + "loss": 0.8015, + "mean_token_accuracy": 0.7568274974822998, + "num_tokens": 80932614.0, + "step": 35000 + }, + { + "epoch": 0.32098652241679654, + "learning_rate": 0.00013580452920143027, + "loss": 0.879, + "mean_token_accuracy": 0.7383477210998535, + "num_tokens": 80955131.0, + "step": 35010 + }, + { + "epoch": 0.3210782066562758, + "learning_rate": 0.00013578619235353443, + "loss": 0.8513, + "mean_token_accuracy": 0.744678795337677, + "num_tokens": 80978554.0, + "step": 35020 + }, + { + "epoch": 0.32116989089575504, + "learning_rate": 0.0001357678555056386, + "loss": 0.7966, + "mean_token_accuracy": 0.7619555592536926, + "num_tokens": 81001515.0, + "step": 35030 + }, + { + "epoch": 0.32126157513523423, + "learning_rate": 0.00013574951865774273, + "loss": 0.8469, + "mean_token_accuracy": 0.7381498634815216, + "num_tokens": 81023827.0, + "step": 35040 + }, + { + "epoch": 0.3213532593747135, + "learning_rate": 0.0001357311818098469, + "loss": 0.8705, + "mean_token_accuracy": 0.7359326004981994, + "num_tokens": 81047193.0, + "step": 35050 + }, + { + "epoch": 0.32144494361419274, + "learning_rate": 0.00013571284496195104, + "loss": 0.8265, + "mean_token_accuracy": 0.7469355463981628, + "num_tokens": 81069044.0, + "step": 35060 + }, + { + "epoch": 0.32153662785367193, + "learning_rate": 0.0001356945081140552, + "loss": 0.8521, + "mean_token_accuracy": 0.7443061113357544, + "num_tokens": 81092424.0, + "step": 35070 + }, + { + "epoch": 0.3216283120931512, + "learning_rate": 0.00013567617126615934, + "loss": 0.8384, + "mean_token_accuracy": 0.7469860255718231, + "num_tokens": 81114963.0, + "step": 35080 + }, + { + "epoch": 0.32171999633263043, + "learning_rate": 0.0001356578344182635, + "loss": 0.8614, + "mean_token_accuracy": 0.7420911133289337, + "num_tokens": 81138069.0, + "step": 35090 + }, + { + "epoch": 0.3218116805721097, + "learning_rate": 0.00013563949757036767, + "loss": 0.8629, + "mean_token_accuracy": 0.7411840558052063, + "num_tokens": 81160431.0, + "step": 35100 + }, + { + "epoch": 0.3219033648115889, + "learning_rate": 0.0001356211607224718, + "loss": 0.8427, + "mean_token_accuracy": 0.7432519495487213, + "num_tokens": 81182957.0, + "step": 35110 + }, + { + "epoch": 0.3219950490510681, + "learning_rate": 0.00013560282387457598, + "loss": 0.8548, + "mean_token_accuracy": 0.748400354385376, + "num_tokens": 81205478.0, + "step": 35120 + }, + { + "epoch": 0.3220867332905474, + "learning_rate": 0.00013558448702668012, + "loss": 0.8344, + "mean_token_accuracy": 0.7453448891639709, + "num_tokens": 81229441.0, + "step": 35130 + }, + { + "epoch": 0.3221784175300266, + "learning_rate": 0.00013556615017878428, + "loss": 0.8525, + "mean_token_accuracy": 0.7415412187576294, + "num_tokens": 81251897.0, + "step": 35140 + }, + { + "epoch": 0.3222701017695058, + "learning_rate": 0.00013554781333088842, + "loss": 0.8785, + "mean_token_accuracy": 0.7355118870735169, + "num_tokens": 81274628.0, + "step": 35150 + }, + { + "epoch": 0.3223617860089851, + "learning_rate": 0.00013552947648299258, + "loss": 0.8675, + "mean_token_accuracy": 0.7326271176338196, + "num_tokens": 81297257.0, + "step": 35160 + }, + { + "epoch": 0.32245347024846427, + "learning_rate": 0.00013551113963509675, + "loss": 0.8415, + "mean_token_accuracy": 0.7444237768650055, + "num_tokens": 81320642.0, + "step": 35170 + }, + { + "epoch": 0.3225451544879435, + "learning_rate": 0.0001354928027872009, + "loss": 0.8489, + "mean_token_accuracy": 0.7437173664569855, + "num_tokens": 81343977.0, + "step": 35180 + }, + { + "epoch": 0.32263683872742277, + "learning_rate": 0.00013547446593930503, + "loss": 0.8649, + "mean_token_accuracy": 0.7386248350143433, + "num_tokens": 81366711.0, + "step": 35190 + }, + { + "epoch": 0.32272852296690197, + "learning_rate": 0.0001354561290914092, + "loss": 0.857, + "mean_token_accuracy": 0.7472717225551605, + "num_tokens": 81389605.0, + "step": 35200 + }, + { + "epoch": 0.3228202072063812, + "learning_rate": 0.00013543779224351333, + "loss": 0.8268, + "mean_token_accuracy": 0.7485568761825562, + "num_tokens": 81412276.0, + "step": 35210 + }, + { + "epoch": 0.32291189144586047, + "learning_rate": 0.0001354194553956175, + "loss": 0.8081, + "mean_token_accuracy": 0.7577523529529572, + "num_tokens": 81435050.0, + "step": 35220 + }, + { + "epoch": 0.3230035756853397, + "learning_rate": 0.00013540111854772166, + "loss": 0.8157, + "mean_token_accuracy": 0.7532997727394104, + "num_tokens": 81458130.0, + "step": 35230 + }, + { + "epoch": 0.3230952599248189, + "learning_rate": 0.0001353827816998258, + "loss": 0.8404, + "mean_token_accuracy": 0.7457041919231415, + "num_tokens": 81481495.0, + "step": 35240 + }, + { + "epoch": 0.32318694416429816, + "learning_rate": 0.00013536444485192996, + "loss": 0.8819, + "mean_token_accuracy": 0.7388751924037933, + "num_tokens": 81504352.0, + "step": 35250 + }, + { + "epoch": 0.3232786284037774, + "learning_rate": 0.0001353461080040341, + "loss": 0.8456, + "mean_token_accuracy": 0.7405800104141236, + "num_tokens": 81527779.0, + "step": 35260 + }, + { + "epoch": 0.3233703126432566, + "learning_rate": 0.00013532777115613827, + "loss": 0.8478, + "mean_token_accuracy": 0.7437808692455292, + "num_tokens": 81550871.0, + "step": 35270 + }, + { + "epoch": 0.32346199688273586, + "learning_rate": 0.0001353094343082424, + "loss": 0.8436, + "mean_token_accuracy": 0.7423400282859802, + "num_tokens": 81574427.0, + "step": 35280 + }, + { + "epoch": 0.3235536811222151, + "learning_rate": 0.00013529109746034657, + "loss": 0.8545, + "mean_token_accuracy": 0.7487216591835022, + "num_tokens": 81596950.0, + "step": 35290 + }, + { + "epoch": 0.3236453653616943, + "learning_rate": 0.00013527276061245074, + "loss": 0.8621, + "mean_token_accuracy": 0.7433628737926483, + "num_tokens": 81619335.0, + "step": 35300 + }, + { + "epoch": 0.32373704960117355, + "learning_rate": 0.00013525442376455488, + "loss": 0.8204, + "mean_token_accuracy": 0.7557617902755738, + "num_tokens": 81642327.0, + "step": 35310 + }, + { + "epoch": 0.3238287338406528, + "learning_rate": 0.00013523608691665904, + "loss": 0.8274, + "mean_token_accuracy": 0.7449274480342865, + "num_tokens": 81665850.0, + "step": 35320 + }, + { + "epoch": 0.323920418080132, + "learning_rate": 0.00013521775006876318, + "loss": 0.8801, + "mean_token_accuracy": 0.743822056055069, + "num_tokens": 81688793.0, + "step": 35330 + }, + { + "epoch": 0.32401210231961125, + "learning_rate": 0.00013519941322086735, + "loss": 0.8587, + "mean_token_accuracy": 0.7431145966053009, + "num_tokens": 81711704.0, + "step": 35340 + }, + { + "epoch": 0.3241037865590905, + "learning_rate": 0.00013518107637297148, + "loss": 0.8845, + "mean_token_accuracy": 0.7453645706176758, + "num_tokens": 81734610.0, + "step": 35350 + }, + { + "epoch": 0.32419547079856975, + "learning_rate": 0.00013516273952507565, + "loss": 0.8195, + "mean_token_accuracy": 0.7508151352405548, + "num_tokens": 81757684.0, + "step": 35360 + }, + { + "epoch": 0.32428715503804895, + "learning_rate": 0.00013514440267717981, + "loss": 0.8429, + "mean_token_accuracy": 0.7492231905460358, + "num_tokens": 81781581.0, + "step": 35370 + }, + { + "epoch": 0.3243788392775282, + "learning_rate": 0.00013512606582928395, + "loss": 0.795, + "mean_token_accuracy": 0.7528245329856873, + "num_tokens": 81803708.0, + "step": 35380 + }, + { + "epoch": 0.32447052351700745, + "learning_rate": 0.0001351077289813881, + "loss": 0.8331, + "mean_token_accuracy": 0.7523864388465882, + "num_tokens": 81826149.0, + "step": 35390 + }, + { + "epoch": 0.32456220775648664, + "learning_rate": 0.00013508939213349226, + "loss": 0.8414, + "mean_token_accuracy": 0.7468234360218048, + "num_tokens": 81849109.0, + "step": 35400 + }, + { + "epoch": 0.3246538919959659, + "learning_rate": 0.0001350710552855964, + "loss": 0.8618, + "mean_token_accuracy": 0.7513863444328308, + "num_tokens": 81872404.0, + "step": 35410 + }, + { + "epoch": 0.32474557623544514, + "learning_rate": 0.0001350527184377006, + "loss": 0.8337, + "mean_token_accuracy": 0.7513627886772156, + "num_tokens": 81895299.0, + "step": 35420 + }, + { + "epoch": 0.32483726047492434, + "learning_rate": 0.00013503438158980473, + "loss": 0.8311, + "mean_token_accuracy": 0.7515579104423523, + "num_tokens": 81918391.0, + "step": 35430 + }, + { + "epoch": 0.3249289447144036, + "learning_rate": 0.00013501604474190886, + "loss": 0.8473, + "mean_token_accuracy": 0.7471840679645538, + "num_tokens": 81941487.0, + "step": 35440 + }, + { + "epoch": 0.32502062895388284, + "learning_rate": 0.00013499770789401303, + "loss": 0.8646, + "mean_token_accuracy": 0.7400823950767517, + "num_tokens": 81964909.0, + "step": 35450 + }, + { + "epoch": 0.32511231319336203, + "learning_rate": 0.00013497937104611717, + "loss": 0.8316, + "mean_token_accuracy": 0.7515281498432159, + "num_tokens": 81988848.0, + "step": 35460 + }, + { + "epoch": 0.3252039974328413, + "learning_rate": 0.00013496103419822133, + "loss": 0.8309, + "mean_token_accuracy": 0.7513287782669067, + "num_tokens": 82012459.0, + "step": 35470 + }, + { + "epoch": 0.32529568167232054, + "learning_rate": 0.00013494269735032547, + "loss": 0.8645, + "mean_token_accuracy": 0.740870189666748, + "num_tokens": 82036273.0, + "step": 35480 + }, + { + "epoch": 0.3253873659117998, + "learning_rate": 0.00013492436050242964, + "loss": 0.8206, + "mean_token_accuracy": 0.7488671004772186, + "num_tokens": 82058919.0, + "step": 35490 + }, + { + "epoch": 0.325479050151279, + "learning_rate": 0.0001349060236545338, + "loss": 0.8227, + "mean_token_accuracy": 0.7483937859535217, + "num_tokens": 82081852.0, + "step": 35500 + }, + { + "epoch": 0.32557073439075823, + "learning_rate": 0.00013488768680663794, + "loss": 0.8724, + "mean_token_accuracy": 0.7361494719982147, + "num_tokens": 82104310.0, + "step": 35510 + }, + { + "epoch": 0.3256624186302375, + "learning_rate": 0.0001348693499587421, + "loss": 0.8589, + "mean_token_accuracy": 0.7421862840652466, + "num_tokens": 82127545.0, + "step": 35520 + }, + { + "epoch": 0.3257541028697167, + "learning_rate": 0.00013485101311084624, + "loss": 0.8176, + "mean_token_accuracy": 0.7536823272705078, + "num_tokens": 82150812.0, + "step": 35530 + }, + { + "epoch": 0.32584578710919593, + "learning_rate": 0.0001348326762629504, + "loss": 0.843, + "mean_token_accuracy": 0.7387829601764679, + "num_tokens": 82174944.0, + "step": 35540 + }, + { + "epoch": 0.3259374713486752, + "learning_rate": 0.00013481433941505457, + "loss": 0.8474, + "mean_token_accuracy": 0.7454278707504273, + "num_tokens": 82197846.0, + "step": 35550 + }, + { + "epoch": 0.3260291555881544, + "learning_rate": 0.0001347960025671587, + "loss": 0.848, + "mean_token_accuracy": 0.7468889653682709, + "num_tokens": 82221244.0, + "step": 35560 + }, + { + "epoch": 0.3261208398276336, + "learning_rate": 0.00013477766571926288, + "loss": 0.8299, + "mean_token_accuracy": 0.7487314581871033, + "num_tokens": 82244019.0, + "step": 35570 + }, + { + "epoch": 0.3262125240671129, + "learning_rate": 0.00013475932887136702, + "loss": 0.9003, + "mean_token_accuracy": 0.7275493264198303, + "num_tokens": 82267283.0, + "step": 35580 + }, + { + "epoch": 0.32630420830659207, + "learning_rate": 0.00013474099202347116, + "loss": 0.8805, + "mean_token_accuracy": 0.736548376083374, + "num_tokens": 82290406.0, + "step": 35590 + }, + { + "epoch": 0.3263958925460713, + "learning_rate": 0.00013472265517557532, + "loss": 0.8571, + "mean_token_accuracy": 0.7379210770130158, + "num_tokens": 82313558.0, + "step": 35600 + }, + { + "epoch": 0.32648757678555057, + "learning_rate": 0.00013470431832767946, + "loss": 0.8441, + "mean_token_accuracy": 0.7455053985118866, + "num_tokens": 82335906.0, + "step": 35610 + }, + { + "epoch": 0.3265792610250298, + "learning_rate": 0.00013468598147978365, + "loss": 0.8212, + "mean_token_accuracy": 0.7589194655418396, + "num_tokens": 82358530.0, + "step": 35620 + }, + { + "epoch": 0.326670945264509, + "learning_rate": 0.0001346676446318878, + "loss": 0.8665, + "mean_token_accuracy": 0.7412411212921143, + "num_tokens": 82382048.0, + "step": 35630 + }, + { + "epoch": 0.32676262950398827, + "learning_rate": 0.00013464930778399193, + "loss": 0.838, + "mean_token_accuracy": 0.7476840674877167, + "num_tokens": 82404846.0, + "step": 35640 + }, + { + "epoch": 0.3268543137434675, + "learning_rate": 0.0001346309709360961, + "loss": 0.8966, + "mean_token_accuracy": 0.7345963656902313, + "num_tokens": 82427674.0, + "step": 35650 + }, + { + "epoch": 0.3269459979829467, + "learning_rate": 0.00013461263408820023, + "loss": 0.8015, + "mean_token_accuracy": 0.75493882894516, + "num_tokens": 82450146.0, + "step": 35660 + }, + { + "epoch": 0.32703768222242596, + "learning_rate": 0.0001345942972403044, + "loss": 0.8497, + "mean_token_accuracy": 0.7464676558971405, + "num_tokens": 82472582.0, + "step": 35670 + }, + { + "epoch": 0.3271293664619052, + "learning_rate": 0.00013457596039240856, + "loss": 0.8427, + "mean_token_accuracy": 0.7504710197448731, + "num_tokens": 82495685.0, + "step": 35680 + }, + { + "epoch": 0.3272210507013844, + "learning_rate": 0.0001345576235445127, + "loss": 0.8464, + "mean_token_accuracy": 0.7482772767543793, + "num_tokens": 82518711.0, + "step": 35690 + }, + { + "epoch": 0.32731273494086366, + "learning_rate": 0.00013453928669661687, + "loss": 0.8652, + "mean_token_accuracy": 0.7443857192993164, + "num_tokens": 82541345.0, + "step": 35700 + }, + { + "epoch": 0.3274044191803429, + "learning_rate": 0.000134520949848721, + "loss": 0.8553, + "mean_token_accuracy": 0.7438439548015594, + "num_tokens": 82563974.0, + "step": 35710 + }, + { + "epoch": 0.32749610341982216, + "learning_rate": 0.00013450261300082517, + "loss": 0.8499, + "mean_token_accuracy": 0.7503586053848267, + "num_tokens": 82587554.0, + "step": 35720 + }, + { + "epoch": 0.32758778765930135, + "learning_rate": 0.0001344842761529293, + "loss": 0.8833, + "mean_token_accuracy": 0.739331042766571, + "num_tokens": 82610042.0, + "step": 35730 + }, + { + "epoch": 0.3276794718987806, + "learning_rate": 0.00013446593930503347, + "loss": 0.8032, + "mean_token_accuracy": 0.7542295634746552, + "num_tokens": 82633565.0, + "step": 35740 + }, + { + "epoch": 0.32777115613825986, + "learning_rate": 0.00013444760245713764, + "loss": 0.878, + "mean_token_accuracy": 0.7337488234043121, + "num_tokens": 82656625.0, + "step": 35750 + }, + { + "epoch": 0.32786284037773905, + "learning_rate": 0.00013442926560924178, + "loss": 0.8909, + "mean_token_accuracy": 0.7295827150344849, + "num_tokens": 82679780.0, + "step": 35760 + }, + { + "epoch": 0.3279545246172183, + "learning_rate": 0.00013441092876134594, + "loss": 0.8363, + "mean_token_accuracy": 0.7473319292068481, + "num_tokens": 82704065.0, + "step": 35770 + }, + { + "epoch": 0.32804620885669755, + "learning_rate": 0.00013439259191345008, + "loss": 0.8143, + "mean_token_accuracy": 0.7503743290901184, + "num_tokens": 82727035.0, + "step": 35780 + }, + { + "epoch": 0.32813789309617675, + "learning_rate": 0.00013437425506555422, + "loss": 0.8387, + "mean_token_accuracy": 0.755956894159317, + "num_tokens": 82750698.0, + "step": 35790 + }, + { + "epoch": 0.328229577335656, + "learning_rate": 0.00013435591821765839, + "loss": 0.8515, + "mean_token_accuracy": 0.7519905805587769, + "num_tokens": 82773181.0, + "step": 35800 + }, + { + "epoch": 0.32832126157513525, + "learning_rate": 0.00013433758136976255, + "loss": 0.8463, + "mean_token_accuracy": 0.7504700422286987, + "num_tokens": 82796677.0, + "step": 35810 + }, + { + "epoch": 0.32841294581461444, + "learning_rate": 0.00013431924452186672, + "loss": 0.8313, + "mean_token_accuracy": 0.7485404849052429, + "num_tokens": 82820405.0, + "step": 35820 + }, + { + "epoch": 0.3285046300540937, + "learning_rate": 0.00013430090767397085, + "loss": 0.8598, + "mean_token_accuracy": 0.7402553975582122, + "num_tokens": 82844118.0, + "step": 35830 + }, + { + "epoch": 0.32859631429357294, + "learning_rate": 0.000134282570826075, + "loss": 0.8349, + "mean_token_accuracy": 0.7491594135761261, + "num_tokens": 82867156.0, + "step": 35840 + }, + { + "epoch": 0.3286879985330522, + "learning_rate": 0.00013426423397817916, + "loss": 0.8042, + "mean_token_accuracy": 0.7536715269088745, + "num_tokens": 82889919.0, + "step": 35850 + }, + { + "epoch": 0.3287796827725314, + "learning_rate": 0.0001342458971302833, + "loss": 0.8796, + "mean_token_accuracy": 0.7440406084060669, + "num_tokens": 82913503.0, + "step": 35860 + }, + { + "epoch": 0.32887136701201064, + "learning_rate": 0.00013422756028238746, + "loss": 0.8564, + "mean_token_accuracy": 0.7469022214412689, + "num_tokens": 82936700.0, + "step": 35870 + }, + { + "epoch": 0.3289630512514899, + "learning_rate": 0.00013420922343449163, + "loss": 0.8166, + "mean_token_accuracy": 0.7591893672943115, + "num_tokens": 82959989.0, + "step": 35880 + }, + { + "epoch": 0.3290547354909691, + "learning_rate": 0.00013419088658659577, + "loss": 0.8533, + "mean_token_accuracy": 0.7430768609046936, + "num_tokens": 82982688.0, + "step": 35890 + }, + { + "epoch": 0.32914641973044834, + "learning_rate": 0.00013417254973869993, + "loss": 0.8211, + "mean_token_accuracy": 0.7535585284233093, + "num_tokens": 83004976.0, + "step": 35900 + }, + { + "epoch": 0.3292381039699276, + "learning_rate": 0.00013415421289080407, + "loss": 0.8587, + "mean_token_accuracy": 0.7439225792884827, + "num_tokens": 83028886.0, + "step": 35910 + }, + { + "epoch": 0.3293297882094068, + "learning_rate": 0.00013413587604290823, + "loss": 0.8806, + "mean_token_accuracy": 0.7404143691062928, + "num_tokens": 83051375.0, + "step": 35920 + }, + { + "epoch": 0.32942147244888603, + "learning_rate": 0.00013411753919501237, + "loss": 0.8078, + "mean_token_accuracy": 0.7531822741031646, + "num_tokens": 83075443.0, + "step": 35930 + }, + { + "epoch": 0.3295131566883653, + "learning_rate": 0.00013409920234711654, + "loss": 0.8464, + "mean_token_accuracy": 0.7476143658161163, + "num_tokens": 83097861.0, + "step": 35940 + }, + { + "epoch": 0.3296048409278445, + "learning_rate": 0.0001340808654992207, + "loss": 0.8668, + "mean_token_accuracy": 0.7435589492321014, + "num_tokens": 83121036.0, + "step": 35950 + }, + { + "epoch": 0.32969652516732373, + "learning_rate": 0.00013406252865132484, + "loss": 0.8407, + "mean_token_accuracy": 0.7459194183349609, + "num_tokens": 83144332.0, + "step": 35960 + }, + { + "epoch": 0.329788209406803, + "learning_rate": 0.000134044191803429, + "loss": 0.8256, + "mean_token_accuracy": 0.752760899066925, + "num_tokens": 83168003.0, + "step": 35970 + }, + { + "epoch": 0.32987989364628223, + "learning_rate": 0.00013402585495553315, + "loss": 0.8251, + "mean_token_accuracy": 0.7474977254867554, + "num_tokens": 83191122.0, + "step": 35980 + }, + { + "epoch": 0.3299715778857614, + "learning_rate": 0.00013400751810763728, + "loss": 0.8246, + "mean_token_accuracy": 0.7548482060432434, + "num_tokens": 83214237.0, + "step": 35990 + }, + { + "epoch": 0.3300632621252407, + "learning_rate": 0.00013398918125974145, + "loss": 0.8481, + "mean_token_accuracy": 0.7422476232051849, + "num_tokens": 83237553.0, + "step": 36000 + }, + { + "epoch": 0.3301549463647199, + "learning_rate": 0.00013397084441184562, + "loss": 0.86, + "mean_token_accuracy": 0.7420591831207275, + "num_tokens": 83261411.0, + "step": 36010 + }, + { + "epoch": 0.3302466306041991, + "learning_rate": 0.00013395250756394978, + "loss": 0.8796, + "mean_token_accuracy": 0.7426454842090606, + "num_tokens": 83284089.0, + "step": 36020 + }, + { + "epoch": 0.33033831484367837, + "learning_rate": 0.00013393417071605392, + "loss": 0.8342, + "mean_token_accuracy": 0.7506460428237915, + "num_tokens": 83306866.0, + "step": 36030 + }, + { + "epoch": 0.3304299990831576, + "learning_rate": 0.00013391583386815806, + "loss": 0.8875, + "mean_token_accuracy": 0.733001071214676, + "num_tokens": 83329752.0, + "step": 36040 + }, + { + "epoch": 0.3305216833226368, + "learning_rate": 0.00013389749702026222, + "loss": 0.8664, + "mean_token_accuracy": 0.748653793334961, + "num_tokens": 83353323.0, + "step": 36050 + }, + { + "epoch": 0.33061336756211607, + "learning_rate": 0.00013387916017236636, + "loss": 0.8249, + "mean_token_accuracy": 0.7484886705875397, + "num_tokens": 83376495.0, + "step": 36060 + }, + { + "epoch": 0.3307050518015953, + "learning_rate": 0.00013386082332447053, + "loss": 0.8446, + "mean_token_accuracy": 0.7476909399032593, + "num_tokens": 83399869.0, + "step": 36070 + }, + { + "epoch": 0.3307967360410745, + "learning_rate": 0.0001338424864765747, + "loss": 0.8113, + "mean_token_accuracy": 0.7545444250106812, + "num_tokens": 83422697.0, + "step": 36080 + }, + { + "epoch": 0.33088842028055376, + "learning_rate": 0.00013382414962867883, + "loss": 0.8669, + "mean_token_accuracy": 0.7394547402858734, + "num_tokens": 83445919.0, + "step": 36090 + }, + { + "epoch": 0.330980104520033, + "learning_rate": 0.000133805812780783, + "loss": 0.8522, + "mean_token_accuracy": 0.7406936287879944, + "num_tokens": 83469760.0, + "step": 36100 + }, + { + "epoch": 0.33107178875951226, + "learning_rate": 0.00013378747593288713, + "loss": 0.8207, + "mean_token_accuracy": 0.7470863163471222, + "num_tokens": 83491764.0, + "step": 36110 + }, + { + "epoch": 0.33116347299899146, + "learning_rate": 0.0001337691390849913, + "loss": 0.8272, + "mean_token_accuracy": 0.7513814866542816, + "num_tokens": 83514568.0, + "step": 36120 + }, + { + "epoch": 0.3312551572384707, + "learning_rate": 0.00013375080223709544, + "loss": 0.846, + "mean_token_accuracy": 0.7450028181076049, + "num_tokens": 83536772.0, + "step": 36130 + }, + { + "epoch": 0.33134684147794996, + "learning_rate": 0.0001337324653891996, + "loss": 0.8695, + "mean_token_accuracy": 0.7432056784629821, + "num_tokens": 83559175.0, + "step": 36140 + }, + { + "epoch": 0.33143852571742916, + "learning_rate": 0.00013371412854130377, + "loss": 0.8098, + "mean_token_accuracy": 0.7504313349723816, + "num_tokens": 83581727.0, + "step": 36150 + }, + { + "epoch": 0.3315302099569084, + "learning_rate": 0.0001336957916934079, + "loss": 0.8428, + "mean_token_accuracy": 0.7397641062736511, + "num_tokens": 83605865.0, + "step": 36160 + }, + { + "epoch": 0.33162189419638766, + "learning_rate": 0.00013367745484551207, + "loss": 0.8529, + "mean_token_accuracy": 0.7477608442306518, + "num_tokens": 83629565.0, + "step": 36170 + }, + { + "epoch": 0.33171357843586685, + "learning_rate": 0.0001336591179976162, + "loss": 0.8611, + "mean_token_accuracy": 0.7459795713424683, + "num_tokens": 83651876.0, + "step": 36180 + }, + { + "epoch": 0.3318052626753461, + "learning_rate": 0.00013364078114972035, + "loss": 0.8345, + "mean_token_accuracy": 0.7443089842796325, + "num_tokens": 83674656.0, + "step": 36190 + }, + { + "epoch": 0.33189694691482535, + "learning_rate": 0.00013362244430182451, + "loss": 0.8757, + "mean_token_accuracy": 0.7393298149108887, + "num_tokens": 83697678.0, + "step": 36200 + }, + { + "epoch": 0.33198863115430455, + "learning_rate": 0.00013360410745392868, + "loss": 0.8946, + "mean_token_accuracy": 0.7454830348491669, + "num_tokens": 83720947.0, + "step": 36210 + }, + { + "epoch": 0.3320803153937838, + "learning_rate": 0.00013358577060603284, + "loss": 0.8145, + "mean_token_accuracy": 0.7509842216968536, + "num_tokens": 83743924.0, + "step": 36220 + }, + { + "epoch": 0.33217199963326305, + "learning_rate": 0.00013356743375813698, + "loss": 0.8559, + "mean_token_accuracy": 0.7424210250377655, + "num_tokens": 83767174.0, + "step": 36230 + }, + { + "epoch": 0.3322636838727423, + "learning_rate": 0.00013354909691024112, + "loss": 0.8657, + "mean_token_accuracy": 0.7500545799732208, + "num_tokens": 83789080.0, + "step": 36240 + }, + { + "epoch": 0.3323553681122215, + "learning_rate": 0.0001335307600623453, + "loss": 0.8638, + "mean_token_accuracy": 0.7432078897953034, + "num_tokens": 83812054.0, + "step": 36250 + }, + { + "epoch": 0.33244705235170074, + "learning_rate": 0.00013351242321444943, + "loss": 0.8577, + "mean_token_accuracy": 0.7478015542030334, + "num_tokens": 83834880.0, + "step": 36260 + }, + { + "epoch": 0.33253873659118, + "learning_rate": 0.00013349408636655362, + "loss": 0.8484, + "mean_token_accuracy": 0.7472139954566955, + "num_tokens": 83858308.0, + "step": 36270 + }, + { + "epoch": 0.3326304208306592, + "learning_rate": 0.00013347574951865776, + "loss": 0.85, + "mean_token_accuracy": 0.7430963695049286, + "num_tokens": 83881817.0, + "step": 36280 + }, + { + "epoch": 0.33272210507013844, + "learning_rate": 0.0001334574126707619, + "loss": 0.8463, + "mean_token_accuracy": 0.7436040818691254, + "num_tokens": 83905127.0, + "step": 36290 + }, + { + "epoch": 0.3328137893096177, + "learning_rate": 0.00013343907582286606, + "loss": 0.8588, + "mean_token_accuracy": 0.7438998699188233, + "num_tokens": 83927600.0, + "step": 36300 + }, + { + "epoch": 0.3329054735490969, + "learning_rate": 0.0001334207389749702, + "loss": 0.8501, + "mean_token_accuracy": 0.7480362892150879, + "num_tokens": 83950550.0, + "step": 36310 + }, + { + "epoch": 0.33299715778857614, + "learning_rate": 0.00013340240212707436, + "loss": 0.8317, + "mean_token_accuracy": 0.752432930469513, + "num_tokens": 83973474.0, + "step": 36320 + }, + { + "epoch": 0.3330888420280554, + "learning_rate": 0.0001333840652791785, + "loss": 0.8488, + "mean_token_accuracy": 0.7455214023590088, + "num_tokens": 83996424.0, + "step": 36330 + }, + { + "epoch": 0.33318052626753464, + "learning_rate": 0.00013336572843128267, + "loss": 0.859, + "mean_token_accuracy": 0.7452872037887573, + "num_tokens": 84019412.0, + "step": 36340 + }, + { + "epoch": 0.33327221050701383, + "learning_rate": 0.00013334739158338683, + "loss": 0.8098, + "mean_token_accuracy": 0.756863534450531, + "num_tokens": 84042655.0, + "step": 36350 + }, + { + "epoch": 0.3333638947464931, + "learning_rate": 0.00013332905473549097, + "loss": 0.8562, + "mean_token_accuracy": 0.7415922701358795, + "num_tokens": 84066406.0, + "step": 36360 + }, + { + "epoch": 0.33345557898597233, + "learning_rate": 0.00013331071788759514, + "loss": 0.8106, + "mean_token_accuracy": 0.7486303687095642, + "num_tokens": 84090247.0, + "step": 36370 + }, + { + "epoch": 0.33354726322545153, + "learning_rate": 0.00013329238103969927, + "loss": 0.8572, + "mean_token_accuracy": 0.740035605430603, + "num_tokens": 84113829.0, + "step": 36380 + }, + { + "epoch": 0.3336389474649308, + "learning_rate": 0.0001332740441918034, + "loss": 0.8345, + "mean_token_accuracy": 0.7442825198173523, + "num_tokens": 84137550.0, + "step": 36390 + }, + { + "epoch": 0.33373063170441003, + "learning_rate": 0.0001332557073439076, + "loss": 0.872, + "mean_token_accuracy": 0.7430775403976441, + "num_tokens": 84159965.0, + "step": 36400 + }, + { + "epoch": 0.3338223159438892, + "learning_rate": 0.00013323737049601174, + "loss": 0.8291, + "mean_token_accuracy": 0.7472260773181916, + "num_tokens": 84183451.0, + "step": 36410 + }, + { + "epoch": 0.3339140001833685, + "learning_rate": 0.0001332190336481159, + "loss": 0.8245, + "mean_token_accuracy": 0.7508554220199585, + "num_tokens": 84206829.0, + "step": 36420 + }, + { + "epoch": 0.3340056844228477, + "learning_rate": 0.00013320069680022005, + "loss": 0.852, + "mean_token_accuracy": 0.7439524888992309, + "num_tokens": 84229964.0, + "step": 36430 + }, + { + "epoch": 0.3340973686623269, + "learning_rate": 0.00013318235995232419, + "loss": 0.8965, + "mean_token_accuracy": 0.7367576241493226, + "num_tokens": 84252935.0, + "step": 36440 + }, + { + "epoch": 0.33418905290180617, + "learning_rate": 0.00013316402310442835, + "loss": 0.8265, + "mean_token_accuracy": 0.744022423028946, + "num_tokens": 84276312.0, + "step": 36450 + }, + { + "epoch": 0.3342807371412854, + "learning_rate": 0.0001331456862565325, + "loss": 0.8534, + "mean_token_accuracy": 0.7482629716396332, + "num_tokens": 84299175.0, + "step": 36460 + }, + { + "epoch": 0.3343724213807647, + "learning_rate": 0.00013312734940863668, + "loss": 0.8202, + "mean_token_accuracy": 0.7586467385292053, + "num_tokens": 84322218.0, + "step": 36470 + }, + { + "epoch": 0.33446410562024387, + "learning_rate": 0.00013310901256074082, + "loss": 0.8985, + "mean_token_accuracy": 0.7379003882408142, + "num_tokens": 84344952.0, + "step": 36480 + }, + { + "epoch": 0.3345557898597231, + "learning_rate": 0.00013309067571284496, + "loss": 0.8638, + "mean_token_accuracy": 0.7478548049926758, + "num_tokens": 84368107.0, + "step": 36490 + }, + { + "epoch": 0.33464747409920237, + "learning_rate": 0.00013307233886494912, + "loss": 0.8743, + "mean_token_accuracy": 0.7421445190906525, + "num_tokens": 84391482.0, + "step": 36500 + }, + { + "epoch": 0.33473915833868156, + "learning_rate": 0.00013305400201705326, + "loss": 0.8836, + "mean_token_accuracy": 0.7406928241252899, + "num_tokens": 84414405.0, + "step": 36510 + }, + { + "epoch": 0.3348308425781608, + "learning_rate": 0.00013303566516915743, + "loss": 0.8516, + "mean_token_accuracy": 0.7462628364562989, + "num_tokens": 84437923.0, + "step": 36520 + }, + { + "epoch": 0.33492252681764006, + "learning_rate": 0.0001330173283212616, + "loss": 0.85, + "mean_token_accuracy": 0.7484513282775879, + "num_tokens": 84460627.0, + "step": 36530 + }, + { + "epoch": 0.33501421105711926, + "learning_rate": 0.00013299899147336573, + "loss": 0.8863, + "mean_token_accuracy": 0.7424584090709686, + "num_tokens": 84483322.0, + "step": 36540 + }, + { + "epoch": 0.3351058952965985, + "learning_rate": 0.0001329806546254699, + "loss": 0.8841, + "mean_token_accuracy": 0.7359366238117218, + "num_tokens": 84505527.0, + "step": 36550 + }, + { + "epoch": 0.33519757953607776, + "learning_rate": 0.00013296231777757404, + "loss": 0.8393, + "mean_token_accuracy": 0.7437104701995849, + "num_tokens": 84529547.0, + "step": 36560 + }, + { + "epoch": 0.33528926377555696, + "learning_rate": 0.0001329439809296782, + "loss": 0.8602, + "mean_token_accuracy": 0.7423426568508148, + "num_tokens": 84552247.0, + "step": 36570 + }, + { + "epoch": 0.3353809480150362, + "learning_rate": 0.00013292564408178234, + "loss": 0.873, + "mean_token_accuracy": 0.738763564825058, + "num_tokens": 84574062.0, + "step": 36580 + }, + { + "epoch": 0.33547263225451546, + "learning_rate": 0.00013290730723388648, + "loss": 0.8632, + "mean_token_accuracy": 0.7434098660945893, + "num_tokens": 84597243.0, + "step": 36590 + }, + { + "epoch": 0.3355643164939947, + "learning_rate": 0.00013288897038599067, + "loss": 0.8427, + "mean_token_accuracy": 0.7464635312557221, + "num_tokens": 84619817.0, + "step": 36600 + }, + { + "epoch": 0.3356560007334739, + "learning_rate": 0.0001328706335380948, + "loss": 0.8464, + "mean_token_accuracy": 0.7427412450313569, + "num_tokens": 84642830.0, + "step": 36610 + }, + { + "epoch": 0.33574768497295315, + "learning_rate": 0.00013285229669019897, + "loss": 0.8609, + "mean_token_accuracy": 0.747695368528366, + "num_tokens": 84665975.0, + "step": 36620 + }, + { + "epoch": 0.3358393692124324, + "learning_rate": 0.0001328339598423031, + "loss": 0.8137, + "mean_token_accuracy": 0.750172358751297, + "num_tokens": 84688862.0, + "step": 36630 + }, + { + "epoch": 0.3359310534519116, + "learning_rate": 0.00013281562299440725, + "loss": 0.8433, + "mean_token_accuracy": 0.7464560210704804, + "num_tokens": 84711845.0, + "step": 36640 + }, + { + "epoch": 0.33602273769139085, + "learning_rate": 0.00013279728614651142, + "loss": 0.8554, + "mean_token_accuracy": 0.7443154096603394, + "num_tokens": 84735577.0, + "step": 36650 + }, + { + "epoch": 0.3361144219308701, + "learning_rate": 0.00013277894929861558, + "loss": 0.8332, + "mean_token_accuracy": 0.7442899823188782, + "num_tokens": 84758130.0, + "step": 36660 + }, + { + "epoch": 0.3362061061703493, + "learning_rate": 0.00013276061245071975, + "loss": 0.863, + "mean_token_accuracy": 0.7436336934566498, + "num_tokens": 84781808.0, + "step": 36670 + }, + { + "epoch": 0.33629779040982855, + "learning_rate": 0.00013274227560282389, + "loss": 0.8614, + "mean_token_accuracy": 0.7438279747962951, + "num_tokens": 84804876.0, + "step": 36680 + }, + { + "epoch": 0.3363894746493078, + "learning_rate": 0.00013272393875492802, + "loss": 0.8524, + "mean_token_accuracy": 0.7418655335903168, + "num_tokens": 84828253.0, + "step": 36690 + }, + { + "epoch": 0.336481158888787, + "learning_rate": 0.0001327056019070322, + "loss": 0.8481, + "mean_token_accuracy": 0.7425264775753021, + "num_tokens": 84852049.0, + "step": 36700 + }, + { + "epoch": 0.33657284312826624, + "learning_rate": 0.00013268726505913633, + "loss": 0.8949, + "mean_token_accuracy": 0.7352565705776215, + "num_tokens": 84874657.0, + "step": 36710 + }, + { + "epoch": 0.3366645273677455, + "learning_rate": 0.0001326689282112405, + "loss": 0.8674, + "mean_token_accuracy": 0.7446515262126923, + "num_tokens": 84897173.0, + "step": 36720 + }, + { + "epoch": 0.33675621160722474, + "learning_rate": 0.00013265059136334466, + "loss": 0.8592, + "mean_token_accuracy": 0.7412495791912079, + "num_tokens": 84920633.0, + "step": 36730 + }, + { + "epoch": 0.33684789584670394, + "learning_rate": 0.0001326322545154488, + "loss": 0.8179, + "mean_token_accuracy": 0.7505267918109894, + "num_tokens": 84943480.0, + "step": 36740 + }, + { + "epoch": 0.3369395800861832, + "learning_rate": 0.00013261391766755296, + "loss": 0.8415, + "mean_token_accuracy": 0.7481511950492858, + "num_tokens": 84966045.0, + "step": 36750 + }, + { + "epoch": 0.33703126432566244, + "learning_rate": 0.0001325955808196571, + "loss": 0.8725, + "mean_token_accuracy": 0.7443264424800873, + "num_tokens": 84988586.0, + "step": 36760 + }, + { + "epoch": 0.33712294856514163, + "learning_rate": 0.00013257724397176127, + "loss": 0.8471, + "mean_token_accuracy": 0.747825825214386, + "num_tokens": 85011896.0, + "step": 36770 + }, + { + "epoch": 0.3372146328046209, + "learning_rate": 0.0001325589071238654, + "loss": 0.8326, + "mean_token_accuracy": 0.7540049493312836, + "num_tokens": 85035434.0, + "step": 36780 + }, + { + "epoch": 0.33730631704410013, + "learning_rate": 0.00013254057027596957, + "loss": 0.8405, + "mean_token_accuracy": 0.7456261396408081, + "num_tokens": 85058819.0, + "step": 36790 + }, + { + "epoch": 0.33739800128357933, + "learning_rate": 0.00013252223342807373, + "loss": 0.8358, + "mean_token_accuracy": 0.751392924785614, + "num_tokens": 85082363.0, + "step": 36800 + }, + { + "epoch": 0.3374896855230586, + "learning_rate": 0.00013250389658017787, + "loss": 0.8498, + "mean_token_accuracy": 0.7476738095283508, + "num_tokens": 85104936.0, + "step": 36810 + }, + { + "epoch": 0.33758136976253783, + "learning_rate": 0.00013248555973228204, + "loss": 0.8606, + "mean_token_accuracy": 0.7451462864875793, + "num_tokens": 85128653.0, + "step": 36820 + }, + { + "epoch": 0.337673054002017, + "learning_rate": 0.00013246722288438618, + "loss": 0.8561, + "mean_token_accuracy": 0.7442201793193817, + "num_tokens": 85151880.0, + "step": 36830 + }, + { + "epoch": 0.3377647382414963, + "learning_rate": 0.00013244888603649031, + "loss": 0.8735, + "mean_token_accuracy": 0.7356188356876373, + "num_tokens": 85174037.0, + "step": 36840 + }, + { + "epoch": 0.3378564224809755, + "learning_rate": 0.00013243054918859448, + "loss": 0.8309, + "mean_token_accuracy": 0.75159912109375, + "num_tokens": 85198024.0, + "step": 36850 + }, + { + "epoch": 0.3379481067204548, + "learning_rate": 0.00013241221234069865, + "loss": 0.8691, + "mean_token_accuracy": 0.7484756886959076, + "num_tokens": 85220739.0, + "step": 36860 + }, + { + "epoch": 0.338039790959934, + "learning_rate": 0.0001323938754928028, + "loss": 0.8399, + "mean_token_accuracy": 0.7407955288887024, + "num_tokens": 85243291.0, + "step": 36870 + }, + { + "epoch": 0.3381314751994132, + "learning_rate": 0.00013237553864490695, + "loss": 0.8664, + "mean_token_accuracy": 0.7445390164852143, + "num_tokens": 85266951.0, + "step": 36880 + }, + { + "epoch": 0.3382231594388925, + "learning_rate": 0.0001323572017970111, + "loss": 0.8243, + "mean_token_accuracy": 0.7566348731517791, + "num_tokens": 85290143.0, + "step": 36890 + }, + { + "epoch": 0.33831484367837167, + "learning_rate": 0.00013233886494911525, + "loss": 0.8397, + "mean_token_accuracy": 0.7452965676784515, + "num_tokens": 85312440.0, + "step": 36900 + }, + { + "epoch": 0.3384065279178509, + "learning_rate": 0.0001323205281012194, + "loss": 0.8679, + "mean_token_accuracy": 0.7389244675636292, + "num_tokens": 85335363.0, + "step": 36910 + }, + { + "epoch": 0.33849821215733017, + "learning_rate": 0.00013230219125332358, + "loss": 0.8272, + "mean_token_accuracy": 0.7493228614330292, + "num_tokens": 85358520.0, + "step": 36920 + }, + { + "epoch": 0.33858989639680936, + "learning_rate": 0.00013228385440542772, + "loss": 0.8919, + "mean_token_accuracy": 0.7353790402412415, + "num_tokens": 85381886.0, + "step": 36930 + }, + { + "epoch": 0.3386815806362886, + "learning_rate": 0.00013226551755753186, + "loss": 0.833, + "mean_token_accuracy": 0.7530224323272705, + "num_tokens": 85405009.0, + "step": 36940 + }, + { + "epoch": 0.33877326487576787, + "learning_rate": 0.00013224718070963603, + "loss": 0.8832, + "mean_token_accuracy": 0.7367229163646698, + "num_tokens": 85428120.0, + "step": 36950 + }, + { + "epoch": 0.3388649491152471, + "learning_rate": 0.00013222884386174016, + "loss": 0.8951, + "mean_token_accuracy": 0.7369018435478211, + "num_tokens": 85451075.0, + "step": 36960 + }, + { + "epoch": 0.3389566333547263, + "learning_rate": 0.00013221050701384433, + "loss": 0.8685, + "mean_token_accuracy": 0.7381076693534852, + "num_tokens": 85474371.0, + "step": 36970 + }, + { + "epoch": 0.33904831759420556, + "learning_rate": 0.00013219217016594847, + "loss": 0.8571, + "mean_token_accuracy": 0.7486586391925811, + "num_tokens": 85497716.0, + "step": 36980 + }, + { + "epoch": 0.3391400018336848, + "learning_rate": 0.00013217383331805263, + "loss": 0.8252, + "mean_token_accuracy": 0.7552816092967987, + "num_tokens": 85520387.0, + "step": 36990 + }, + { + "epoch": 0.339231686073164, + "learning_rate": 0.0001321554964701568, + "loss": 0.8121, + "mean_token_accuracy": 0.7532137870788574, + "num_tokens": 85543418.0, + "step": 37000 + }, + { + "epoch": 0.33932337031264326, + "learning_rate": 0.00013213715962226094, + "loss": 0.8275, + "mean_token_accuracy": 0.7536680340766907, + "num_tokens": 85567146.0, + "step": 37010 + }, + { + "epoch": 0.3394150545521225, + "learning_rate": 0.0001321188227743651, + "loss": 0.8708, + "mean_token_accuracy": 0.740613979101181, + "num_tokens": 85590525.0, + "step": 37020 + }, + { + "epoch": 0.3395067387916017, + "learning_rate": 0.00013210048592646924, + "loss": 0.8343, + "mean_token_accuracy": 0.7506062805652618, + "num_tokens": 85612864.0, + "step": 37030 + }, + { + "epoch": 0.33959842303108095, + "learning_rate": 0.00013208214907857338, + "loss": 0.8686, + "mean_token_accuracy": 0.7389248132705688, + "num_tokens": 85636267.0, + "step": 37040 + }, + { + "epoch": 0.3396901072705602, + "learning_rate": 0.00013206381223067757, + "loss": 0.8317, + "mean_token_accuracy": 0.7465624272823334, + "num_tokens": 85659474.0, + "step": 37050 + }, + { + "epoch": 0.3397817915100394, + "learning_rate": 0.0001320454753827817, + "loss": 0.8035, + "mean_token_accuracy": 0.757887351512909, + "num_tokens": 85683234.0, + "step": 37060 + }, + { + "epoch": 0.33987347574951865, + "learning_rate": 0.00013202713853488588, + "loss": 0.8781, + "mean_token_accuracy": 0.7341601371765136, + "num_tokens": 85707234.0, + "step": 37070 + }, + { + "epoch": 0.3399651599889979, + "learning_rate": 0.00013200880168699001, + "loss": 0.8493, + "mean_token_accuracy": 0.744634622335434, + "num_tokens": 85729868.0, + "step": 37080 + }, + { + "epoch": 0.34005684422847715, + "learning_rate": 0.00013199046483909415, + "loss": 0.8351, + "mean_token_accuracy": 0.7524881303310395, + "num_tokens": 85752871.0, + "step": 37090 + }, + { + "epoch": 0.34014852846795635, + "learning_rate": 0.00013197212799119832, + "loss": 0.8437, + "mean_token_accuracy": 0.7475317716598511, + "num_tokens": 85776016.0, + "step": 37100 + }, + { + "epoch": 0.3402402127074356, + "learning_rate": 0.00013195379114330246, + "loss": 0.836, + "mean_token_accuracy": 0.7491052448749542, + "num_tokens": 85799713.0, + "step": 37110 + }, + { + "epoch": 0.34033189694691485, + "learning_rate": 0.00013193545429540665, + "loss": 0.8614, + "mean_token_accuracy": 0.7442010939121246, + "num_tokens": 85822017.0, + "step": 37120 + }, + { + "epoch": 0.34042358118639404, + "learning_rate": 0.0001319171174475108, + "loss": 0.8389, + "mean_token_accuracy": 0.7481133580207825, + "num_tokens": 85845360.0, + "step": 37130 + }, + { + "epoch": 0.3405152654258733, + "learning_rate": 0.00013189878059961493, + "loss": 0.8417, + "mean_token_accuracy": 0.7507116019725799, + "num_tokens": 85868020.0, + "step": 37140 + }, + { + "epoch": 0.34060694966535254, + "learning_rate": 0.0001318804437517191, + "loss": 0.8615, + "mean_token_accuracy": 0.7394050121307373, + "num_tokens": 85891078.0, + "step": 37150 + }, + { + "epoch": 0.34069863390483174, + "learning_rate": 0.00013186210690382323, + "loss": 0.8666, + "mean_token_accuracy": 0.7420512437820435, + "num_tokens": 85914547.0, + "step": 37160 + }, + { + "epoch": 0.340790318144311, + "learning_rate": 0.0001318437700559274, + "loss": 0.8293, + "mean_token_accuracy": 0.7506530165672303, + "num_tokens": 85937453.0, + "step": 37170 + }, + { + "epoch": 0.34088200238379024, + "learning_rate": 0.00013182543320803153, + "loss": 0.8252, + "mean_token_accuracy": 0.7584544062614441, + "num_tokens": 85960622.0, + "step": 37180 + }, + { + "epoch": 0.34097368662326943, + "learning_rate": 0.0001318070963601357, + "loss": 0.8418, + "mean_token_accuracy": 0.7440663695335388, + "num_tokens": 85984150.0, + "step": 37190 + }, + { + "epoch": 0.3410653708627487, + "learning_rate": 0.00013178875951223986, + "loss": 0.8015, + "mean_token_accuracy": 0.7545207738876343, + "num_tokens": 86006654.0, + "step": 37200 + }, + { + "epoch": 0.34115705510222794, + "learning_rate": 0.000131770422664344, + "loss": 0.8287, + "mean_token_accuracy": 0.745617938041687, + "num_tokens": 86029823.0, + "step": 37210 + }, + { + "epoch": 0.3412487393417072, + "learning_rate": 0.00013175208581644817, + "loss": 0.8011, + "mean_token_accuracy": 0.7545137763023376, + "num_tokens": 86053544.0, + "step": 37220 + }, + { + "epoch": 0.3413404235811864, + "learning_rate": 0.0001317337489685523, + "loss": 0.8584, + "mean_token_accuracy": 0.7426408231258392, + "num_tokens": 86076110.0, + "step": 37230 + }, + { + "epoch": 0.34143210782066563, + "learning_rate": 0.00013171541212065644, + "loss": 0.8628, + "mean_token_accuracy": 0.7432761430740357, + "num_tokens": 86099801.0, + "step": 37240 + }, + { + "epoch": 0.3415237920601449, + "learning_rate": 0.00013169707527276064, + "loss": 0.8363, + "mean_token_accuracy": 0.7503327965736389, + "num_tokens": 86121711.0, + "step": 37250 + }, + { + "epoch": 0.3416154762996241, + "learning_rate": 0.00013167873842486477, + "loss": 0.8342, + "mean_token_accuracy": 0.7504224061965943, + "num_tokens": 86144332.0, + "step": 37260 + }, + { + "epoch": 0.3417071605391033, + "learning_rate": 0.00013166040157696894, + "loss": 0.8687, + "mean_token_accuracy": 0.7470543205738067, + "num_tokens": 86167057.0, + "step": 37270 + }, + { + "epoch": 0.3417988447785826, + "learning_rate": 0.00013164206472907308, + "loss": 0.8734, + "mean_token_accuracy": 0.7430323839187623, + "num_tokens": 86190290.0, + "step": 37280 + }, + { + "epoch": 0.3418905290180618, + "learning_rate": 0.00013162372788117722, + "loss": 0.8017, + "mean_token_accuracy": 0.7559139013290406, + "num_tokens": 86213506.0, + "step": 37290 + }, + { + "epoch": 0.341982213257541, + "learning_rate": 0.00013160539103328138, + "loss": 0.8784, + "mean_token_accuracy": 0.7396174609661103, + "num_tokens": 86236711.0, + "step": 37300 + }, + { + "epoch": 0.3420738974970203, + "learning_rate": 0.00013158705418538552, + "loss": 0.8313, + "mean_token_accuracy": 0.7533867299556732, + "num_tokens": 86259182.0, + "step": 37310 + }, + { + "epoch": 0.34216558173649947, + "learning_rate": 0.0001315687173374897, + "loss": 0.8585, + "mean_token_accuracy": 0.7477795958518982, + "num_tokens": 86282316.0, + "step": 37320 + }, + { + "epoch": 0.3422572659759787, + "learning_rate": 0.00013155038048959385, + "loss": 0.8353, + "mean_token_accuracy": 0.7535763680934906, + "num_tokens": 86305575.0, + "step": 37330 + }, + { + "epoch": 0.34234895021545797, + "learning_rate": 0.000131532043641698, + "loss": 0.8176, + "mean_token_accuracy": 0.7536270260810852, + "num_tokens": 86329018.0, + "step": 37340 + }, + { + "epoch": 0.3424406344549372, + "learning_rate": 0.00013151370679380216, + "loss": 0.8741, + "mean_token_accuracy": 0.7423791468143464, + "num_tokens": 86352916.0, + "step": 37350 + }, + { + "epoch": 0.3425323186944164, + "learning_rate": 0.0001314953699459063, + "loss": 0.8224, + "mean_token_accuracy": 0.7576164901256561, + "num_tokens": 86375967.0, + "step": 37360 + }, + { + "epoch": 0.34262400293389567, + "learning_rate": 0.00013147703309801046, + "loss": 0.8772, + "mean_token_accuracy": 0.7445416212081909, + "num_tokens": 86398528.0, + "step": 37370 + }, + { + "epoch": 0.3427156871733749, + "learning_rate": 0.00013145869625011462, + "loss": 0.8697, + "mean_token_accuracy": 0.744277560710907, + "num_tokens": 86421102.0, + "step": 37380 + }, + { + "epoch": 0.3428073714128541, + "learning_rate": 0.00013144035940221876, + "loss": 0.8242, + "mean_token_accuracy": 0.7569944679737091, + "num_tokens": 86444589.0, + "step": 37390 + }, + { + "epoch": 0.34289905565233336, + "learning_rate": 0.00013142202255432293, + "loss": 0.8486, + "mean_token_accuracy": 0.7452614784240723, + "num_tokens": 86468504.0, + "step": 37400 + }, + { + "epoch": 0.3429907398918126, + "learning_rate": 0.00013140368570642707, + "loss": 0.8209, + "mean_token_accuracy": 0.7482340097427368, + "num_tokens": 86491017.0, + "step": 37410 + }, + { + "epoch": 0.3430824241312918, + "learning_rate": 0.00013138534885853123, + "loss": 0.8459, + "mean_token_accuracy": 0.7495341420173645, + "num_tokens": 86513521.0, + "step": 37420 + }, + { + "epoch": 0.34317410837077106, + "learning_rate": 0.00013136701201063537, + "loss": 0.8612, + "mean_token_accuracy": 0.7421615958213806, + "num_tokens": 86536788.0, + "step": 37430 + }, + { + "epoch": 0.3432657926102503, + "learning_rate": 0.0001313486751627395, + "loss": 0.8645, + "mean_token_accuracy": 0.7407772898674011, + "num_tokens": 86559493.0, + "step": 37440 + }, + { + "epoch": 0.3433574768497295, + "learning_rate": 0.0001313303383148437, + "loss": 0.8773, + "mean_token_accuracy": 0.7429486989974976, + "num_tokens": 86582716.0, + "step": 37450 + }, + { + "epoch": 0.34344916108920875, + "learning_rate": 0.00013131200146694784, + "loss": 0.8771, + "mean_token_accuracy": 0.7355626225471497, + "num_tokens": 86605360.0, + "step": 37460 + }, + { + "epoch": 0.343540845328688, + "learning_rate": 0.000131293664619052, + "loss": 0.823, + "mean_token_accuracy": 0.7481252431869507, + "num_tokens": 86629032.0, + "step": 37470 + }, + { + "epoch": 0.34363252956816726, + "learning_rate": 0.00013127532777115614, + "loss": 0.8831, + "mean_token_accuracy": 0.7385040998458863, + "num_tokens": 86651654.0, + "step": 37480 + }, + { + "epoch": 0.34372421380764645, + "learning_rate": 0.00013125699092326028, + "loss": 0.8448, + "mean_token_accuracy": 0.7508082270622254, + "num_tokens": 86674558.0, + "step": 37490 + }, + { + "epoch": 0.3438158980471257, + "learning_rate": 0.00013123865407536445, + "loss": 0.8501, + "mean_token_accuracy": 0.7485431969165802, + "num_tokens": 86697438.0, + "step": 37500 + }, + { + "epoch": 0.34390758228660495, + "learning_rate": 0.0001312203172274686, + "loss": 0.8621, + "mean_token_accuracy": 0.7432440876960754, + "num_tokens": 86720289.0, + "step": 37510 + }, + { + "epoch": 0.34399926652608415, + "learning_rate": 0.00013120198037957278, + "loss": 0.857, + "mean_token_accuracy": 0.7458439469337463, + "num_tokens": 86743169.0, + "step": 37520 + }, + { + "epoch": 0.3440909507655634, + "learning_rate": 0.00013118364353167692, + "loss": 0.8592, + "mean_token_accuracy": 0.7406644225120544, + "num_tokens": 86765674.0, + "step": 37530 + }, + { + "epoch": 0.34418263500504265, + "learning_rate": 0.00013116530668378105, + "loss": 0.8136, + "mean_token_accuracy": 0.7552064299583435, + "num_tokens": 86788919.0, + "step": 37540 + }, + { + "epoch": 0.34427431924452184, + "learning_rate": 0.00013114696983588522, + "loss": 0.8192, + "mean_token_accuracy": 0.7529111206531525, + "num_tokens": 86811614.0, + "step": 37550 + }, + { + "epoch": 0.3443660034840011, + "learning_rate": 0.00013112863298798936, + "loss": 0.8744, + "mean_token_accuracy": 0.7411521255970002, + "num_tokens": 86834577.0, + "step": 37560 + }, + { + "epoch": 0.34445768772348034, + "learning_rate": 0.00013111029614009352, + "loss": 0.8639, + "mean_token_accuracy": 0.7424495041370391, + "num_tokens": 86857501.0, + "step": 37570 + }, + { + "epoch": 0.3445493719629596, + "learning_rate": 0.0001310919592921977, + "loss": 0.8342, + "mean_token_accuracy": 0.7537790715694428, + "num_tokens": 86880464.0, + "step": 37580 + }, + { + "epoch": 0.3446410562024388, + "learning_rate": 0.00013107362244430183, + "loss": 0.8501, + "mean_token_accuracy": 0.742199969291687, + "num_tokens": 86902963.0, + "step": 37590 + }, + { + "epoch": 0.34473274044191804, + "learning_rate": 0.000131055285596406, + "loss": 0.8852, + "mean_token_accuracy": 0.7372816562652588, + "num_tokens": 86927118.0, + "step": 37600 + }, + { + "epoch": 0.3448244246813973, + "learning_rate": 0.00013103694874851013, + "loss": 0.9019, + "mean_token_accuracy": 0.7293107867240906, + "num_tokens": 86950308.0, + "step": 37610 + }, + { + "epoch": 0.3449161089208765, + "learning_rate": 0.0001310186119006143, + "loss": 0.824, + "mean_token_accuracy": 0.7526019752025604, + "num_tokens": 86973391.0, + "step": 37620 + }, + { + "epoch": 0.34500779316035574, + "learning_rate": 0.00013100027505271843, + "loss": 0.8521, + "mean_token_accuracy": 0.7496634900569916, + "num_tokens": 86997271.0, + "step": 37630 + }, + { + "epoch": 0.345099477399835, + "learning_rate": 0.0001309819382048226, + "loss": 0.8726, + "mean_token_accuracy": 0.7416471123695374, + "num_tokens": 87020380.0, + "step": 37640 + }, + { + "epoch": 0.3451911616393142, + "learning_rate": 0.00013096360135692677, + "loss": 0.8231, + "mean_token_accuracy": 0.7499141097068787, + "num_tokens": 87043012.0, + "step": 37650 + }, + { + "epoch": 0.34528284587879343, + "learning_rate": 0.0001309452645090309, + "loss": 0.8591, + "mean_token_accuracy": 0.7471584260463715, + "num_tokens": 87066014.0, + "step": 37660 + }, + { + "epoch": 0.3453745301182727, + "learning_rate": 0.00013092692766113507, + "loss": 0.858, + "mean_token_accuracy": 0.7428099274635315, + "num_tokens": 87089163.0, + "step": 37670 + }, + { + "epoch": 0.3454662143577519, + "learning_rate": 0.0001309085908132392, + "loss": 0.8687, + "mean_token_accuracy": 0.7425667703151703, + "num_tokens": 87111221.0, + "step": 37680 + }, + { + "epoch": 0.34555789859723113, + "learning_rate": 0.00013089025396534335, + "loss": 0.8447, + "mean_token_accuracy": 0.7500782668590545, + "num_tokens": 87134521.0, + "step": 37690 + }, + { + "epoch": 0.3456495828367104, + "learning_rate": 0.0001308719171174475, + "loss": 0.8828, + "mean_token_accuracy": 0.7427931904792786, + "num_tokens": 87157449.0, + "step": 37700 + }, + { + "epoch": 0.34574126707618963, + "learning_rate": 0.00013085358026955168, + "loss": 0.8773, + "mean_token_accuracy": 0.7426659226417541, + "num_tokens": 87180357.0, + "step": 37710 + }, + { + "epoch": 0.3458329513156688, + "learning_rate": 0.00013083524342165584, + "loss": 0.8455, + "mean_token_accuracy": 0.7439717769622802, + "num_tokens": 87203970.0, + "step": 37720 + }, + { + "epoch": 0.3459246355551481, + "learning_rate": 0.00013081690657375998, + "loss": 0.8538, + "mean_token_accuracy": 0.7418691635131835, + "num_tokens": 87227687.0, + "step": 37730 + }, + { + "epoch": 0.3460163197946273, + "learning_rate": 0.00013079856972586412, + "loss": 0.8219, + "mean_token_accuracy": 0.744043642282486, + "num_tokens": 87251269.0, + "step": 37740 + }, + { + "epoch": 0.3461080040341065, + "learning_rate": 0.00013078023287796828, + "loss": 0.8685, + "mean_token_accuracy": 0.744477504491806, + "num_tokens": 87273693.0, + "step": 37750 + }, + { + "epoch": 0.34619968827358577, + "learning_rate": 0.00013076189603007242, + "loss": 0.8315, + "mean_token_accuracy": 0.7536784887313843, + "num_tokens": 87296790.0, + "step": 37760 + }, + { + "epoch": 0.346291372513065, + "learning_rate": 0.0001307435591821766, + "loss": 0.8365, + "mean_token_accuracy": 0.7495584964752198, + "num_tokens": 87319613.0, + "step": 37770 + }, + { + "epoch": 0.3463830567525442, + "learning_rate": 0.00013072522233428075, + "loss": 0.8577, + "mean_token_accuracy": 0.741416972875595, + "num_tokens": 87342338.0, + "step": 37780 + }, + { + "epoch": 0.34647474099202347, + "learning_rate": 0.0001307068854863849, + "loss": 0.8245, + "mean_token_accuracy": 0.7562924802303315, + "num_tokens": 87365148.0, + "step": 37790 + }, + { + "epoch": 0.3465664252315027, + "learning_rate": 0.00013068854863848906, + "loss": 0.8291, + "mean_token_accuracy": 0.7532803475856781, + "num_tokens": 87388057.0, + "step": 37800 + }, + { + "epoch": 0.3466581094709819, + "learning_rate": 0.0001306702117905932, + "loss": 0.8232, + "mean_token_accuracy": 0.7507896840572357, + "num_tokens": 87411028.0, + "step": 37810 + }, + { + "epoch": 0.34674979371046116, + "learning_rate": 0.00013065187494269736, + "loss": 0.8323, + "mean_token_accuracy": 0.7489738523960113, + "num_tokens": 87435038.0, + "step": 37820 + }, + { + "epoch": 0.3468414779499404, + "learning_rate": 0.0001306335380948015, + "loss": 0.8617, + "mean_token_accuracy": 0.7449505984783172, + "num_tokens": 87458597.0, + "step": 37830 + }, + { + "epoch": 0.34693316218941966, + "learning_rate": 0.00013061520124690566, + "loss": 0.8692, + "mean_token_accuracy": 0.7353573739528656, + "num_tokens": 87481060.0, + "step": 37840 + }, + { + "epoch": 0.34702484642889886, + "learning_rate": 0.00013059686439900983, + "loss": 0.8923, + "mean_token_accuracy": 0.7383727550506591, + "num_tokens": 87504648.0, + "step": 37850 + }, + { + "epoch": 0.3471165306683781, + "learning_rate": 0.00013057852755111397, + "loss": 0.8376, + "mean_token_accuracy": 0.7521066486835479, + "num_tokens": 87527636.0, + "step": 37860 + }, + { + "epoch": 0.34720821490785736, + "learning_rate": 0.00013056019070321813, + "loss": 0.8213, + "mean_token_accuracy": 0.748869800567627, + "num_tokens": 87550078.0, + "step": 37870 + }, + { + "epoch": 0.34729989914733655, + "learning_rate": 0.00013054185385532227, + "loss": 0.8356, + "mean_token_accuracy": 0.7438906967639923, + "num_tokens": 87572798.0, + "step": 37880 + }, + { + "epoch": 0.3473915833868158, + "learning_rate": 0.0001305235170074264, + "loss": 0.8193, + "mean_token_accuracy": 0.7509337663650513, + "num_tokens": 87595912.0, + "step": 37890 + }, + { + "epoch": 0.34748326762629506, + "learning_rate": 0.0001305051801595306, + "loss": 0.8567, + "mean_token_accuracy": 0.7424492061138153, + "num_tokens": 87618768.0, + "step": 37900 + }, + { + "epoch": 0.34757495186577425, + "learning_rate": 0.00013048684331163474, + "loss": 0.8203, + "mean_token_accuracy": 0.7546485662460327, + "num_tokens": 87642943.0, + "step": 37910 + }, + { + "epoch": 0.3476666361052535, + "learning_rate": 0.0001304685064637389, + "loss": 0.8419, + "mean_token_accuracy": 0.7400360822677612, + "num_tokens": 87666185.0, + "step": 37920 + }, + { + "epoch": 0.34775832034473275, + "learning_rate": 0.00013045016961584304, + "loss": 0.843, + "mean_token_accuracy": 0.7454596698284149, + "num_tokens": 87688712.0, + "step": 37930 + }, + { + "epoch": 0.34785000458421195, + "learning_rate": 0.00013043183276794718, + "loss": 0.8901, + "mean_token_accuracy": 0.7401292622089386, + "num_tokens": 87711469.0, + "step": 37940 + }, + { + "epoch": 0.3479416888236912, + "learning_rate": 0.00013041349592005135, + "loss": 0.8863, + "mean_token_accuracy": 0.7317825496196747, + "num_tokens": 87733921.0, + "step": 37950 + }, + { + "epoch": 0.34803337306317045, + "learning_rate": 0.0001303951590721555, + "loss": 0.8743, + "mean_token_accuracy": 0.7413212358951569, + "num_tokens": 87756943.0, + "step": 37960 + }, + { + "epoch": 0.3481250573026497, + "learning_rate": 0.00013037682222425965, + "loss": 0.8531, + "mean_token_accuracy": 0.7407483100891114, + "num_tokens": 87779530.0, + "step": 37970 + }, + { + "epoch": 0.3482167415421289, + "learning_rate": 0.00013035848537636382, + "loss": 0.8558, + "mean_token_accuracy": 0.7409225344657898, + "num_tokens": 87802282.0, + "step": 37980 + }, + { + "epoch": 0.34830842578160814, + "learning_rate": 0.00013034014852846796, + "loss": 0.8453, + "mean_token_accuracy": 0.7477506041526795, + "num_tokens": 87824812.0, + "step": 37990 + }, + { + "epoch": 0.3484001100210874, + "learning_rate": 0.00013032181168057212, + "loss": 0.8426, + "mean_token_accuracy": 0.7458292841911316, + "num_tokens": 87847989.0, + "step": 38000 + }, + { + "epoch": 0.3484917942605666, + "learning_rate": 0.00013030347483267626, + "loss": 0.8286, + "mean_token_accuracy": 0.7489347279071807, + "num_tokens": 87870754.0, + "step": 38010 + }, + { + "epoch": 0.34858347850004584, + "learning_rate": 0.00013028513798478043, + "loss": 0.8477, + "mean_token_accuracy": 0.7397971987724304, + "num_tokens": 87894222.0, + "step": 38020 + }, + { + "epoch": 0.3486751627395251, + "learning_rate": 0.0001302668011368846, + "loss": 0.8408, + "mean_token_accuracy": 0.7475711643695832, + "num_tokens": 87917482.0, + "step": 38030 + }, + { + "epoch": 0.3487668469790043, + "learning_rate": 0.00013024846428898873, + "loss": 0.8524, + "mean_token_accuracy": 0.7466792702674866, + "num_tokens": 87939990.0, + "step": 38040 + }, + { + "epoch": 0.34885853121848354, + "learning_rate": 0.0001302301274410929, + "loss": 0.8713, + "mean_token_accuracy": 0.740998363494873, + "num_tokens": 87963274.0, + "step": 38050 + }, + { + "epoch": 0.3489502154579628, + "learning_rate": 0.00013021179059319703, + "loss": 0.7988, + "mean_token_accuracy": 0.7589530646800995, + "num_tokens": 87985674.0, + "step": 38060 + }, + { + "epoch": 0.34904189969744204, + "learning_rate": 0.0001301934537453012, + "loss": 0.8429, + "mean_token_accuracy": 0.7426394581794739, + "num_tokens": 88008767.0, + "step": 38070 + }, + { + "epoch": 0.34913358393692123, + "learning_rate": 0.00013017511689740534, + "loss": 0.8585, + "mean_token_accuracy": 0.740776801109314, + "num_tokens": 88032679.0, + "step": 38080 + }, + { + "epoch": 0.3492252681764005, + "learning_rate": 0.00013015678004950947, + "loss": 0.8563, + "mean_token_accuracy": 0.7444301605224609, + "num_tokens": 88055877.0, + "step": 38090 + }, + { + "epoch": 0.34931695241587973, + "learning_rate": 0.00013013844320161367, + "loss": 0.8585, + "mean_token_accuracy": 0.7415159523487092, + "num_tokens": 88079298.0, + "step": 38100 + }, + { + "epoch": 0.34940863665535893, + "learning_rate": 0.0001301201063537178, + "loss": 0.8382, + "mean_token_accuracy": 0.7479581534862518, + "num_tokens": 88102502.0, + "step": 38110 + }, + { + "epoch": 0.3495003208948382, + "learning_rate": 0.00013010176950582197, + "loss": 0.8498, + "mean_token_accuracy": 0.7455908417701721, + "num_tokens": 88125584.0, + "step": 38120 + }, + { + "epoch": 0.34959200513431743, + "learning_rate": 0.0001300834326579261, + "loss": 0.8383, + "mean_token_accuracy": 0.7464239716529846, + "num_tokens": 88148301.0, + "step": 38130 + }, + { + "epoch": 0.3496836893737966, + "learning_rate": 0.00013006509581003025, + "loss": 0.8461, + "mean_token_accuracy": 0.7454171359539032, + "num_tokens": 88171274.0, + "step": 38140 + }, + { + "epoch": 0.3497753736132759, + "learning_rate": 0.0001300467589621344, + "loss": 0.8529, + "mean_token_accuracy": 0.750511234998703, + "num_tokens": 88194919.0, + "step": 38150 + }, + { + "epoch": 0.3498670578527551, + "learning_rate": 0.00013002842211423858, + "loss": 0.8374, + "mean_token_accuracy": 0.7474356830120087, + "num_tokens": 88217787.0, + "step": 38160 + }, + { + "epoch": 0.3499587420922343, + "learning_rate": 0.00013001008526634272, + "loss": 0.8546, + "mean_token_accuracy": 0.7470196425914765, + "num_tokens": 88240788.0, + "step": 38170 + }, + { + "epoch": 0.35005042633171357, + "learning_rate": 0.00012999174841844688, + "loss": 0.8642, + "mean_token_accuracy": 0.7350736796855927, + "num_tokens": 88262889.0, + "step": 38180 + }, + { + "epoch": 0.3501421105711928, + "learning_rate": 0.00012997341157055102, + "loss": 0.8467, + "mean_token_accuracy": 0.7441868960857392, + "num_tokens": 88285565.0, + "step": 38190 + }, + { + "epoch": 0.35023379481067207, + "learning_rate": 0.00012995507472265519, + "loss": 0.8861, + "mean_token_accuracy": 0.7338118314743042, + "num_tokens": 88308280.0, + "step": 38200 + }, + { + "epoch": 0.35032547905015127, + "learning_rate": 0.00012993673787475932, + "loss": 0.9061, + "mean_token_accuracy": 0.7339636385440826, + "num_tokens": 88330976.0, + "step": 38210 + }, + { + "epoch": 0.3504171632896305, + "learning_rate": 0.0001299184010268635, + "loss": 0.8417, + "mean_token_accuracy": 0.7496311962604523, + "num_tokens": 88353606.0, + "step": 38220 + }, + { + "epoch": 0.35050884752910977, + "learning_rate": 0.00012990006417896765, + "loss": 0.8338, + "mean_token_accuracy": 0.7457334578037262, + "num_tokens": 88375937.0, + "step": 38230 + }, + { + "epoch": 0.35060053176858896, + "learning_rate": 0.0001298817273310718, + "loss": 0.8359, + "mean_token_accuracy": 0.7450960040092468, + "num_tokens": 88398913.0, + "step": 38240 + }, + { + "epoch": 0.3506922160080682, + "learning_rate": 0.00012986339048317596, + "loss": 0.8332, + "mean_token_accuracy": 0.7556888043880463, + "num_tokens": 88422414.0, + "step": 38250 + }, + { + "epoch": 0.35078390024754746, + "learning_rate": 0.0001298450536352801, + "loss": 0.8166, + "mean_token_accuracy": 0.7548144578933715, + "num_tokens": 88445186.0, + "step": 38260 + }, + { + "epoch": 0.35087558448702666, + "learning_rate": 0.00012982671678738426, + "loss": 0.8977, + "mean_token_accuracy": 0.7276447057723999, + "num_tokens": 88468663.0, + "step": 38270 + }, + { + "epoch": 0.3509672687265059, + "learning_rate": 0.0001298083799394884, + "loss": 0.8698, + "mean_token_accuracy": 0.7385667145252228, + "num_tokens": 88491986.0, + "step": 38280 + }, + { + "epoch": 0.35105895296598516, + "learning_rate": 0.00012979004309159257, + "loss": 0.8491, + "mean_token_accuracy": 0.7474011480808258, + "num_tokens": 88515616.0, + "step": 38290 + }, + { + "epoch": 0.35115063720546436, + "learning_rate": 0.00012977170624369673, + "loss": 0.8339, + "mean_token_accuracy": 0.7485447883605957, + "num_tokens": 88538853.0, + "step": 38300 + }, + { + "epoch": 0.3512423214449436, + "learning_rate": 0.00012975336939580087, + "loss": 0.8446, + "mean_token_accuracy": 0.7485349535942077, + "num_tokens": 88562617.0, + "step": 38310 + }, + { + "epoch": 0.35133400568442286, + "learning_rate": 0.00012973503254790504, + "loss": 0.8427, + "mean_token_accuracy": 0.749411553144455, + "num_tokens": 88585428.0, + "step": 38320 + }, + { + "epoch": 0.3514256899239021, + "learning_rate": 0.00012971669570000917, + "loss": 0.8661, + "mean_token_accuracy": 0.7448081552982331, + "num_tokens": 88609616.0, + "step": 38330 + }, + { + "epoch": 0.3515173741633813, + "learning_rate": 0.0001296983588521133, + "loss": 0.7972, + "mean_token_accuracy": 0.762670373916626, + "num_tokens": 88632131.0, + "step": 38340 + }, + { + "epoch": 0.35160905840286055, + "learning_rate": 0.00012968002200421748, + "loss": 0.8628, + "mean_token_accuracy": 0.7470655024051667, + "num_tokens": 88655781.0, + "step": 38350 + }, + { + "epoch": 0.3517007426423398, + "learning_rate": 0.00012966168515632164, + "loss": 0.8415, + "mean_token_accuracy": 0.7441945314407349, + "num_tokens": 88679327.0, + "step": 38360 + }, + { + "epoch": 0.351792426881819, + "learning_rate": 0.00012964334830842578, + "loss": 0.8707, + "mean_token_accuracy": 0.7448734819889069, + "num_tokens": 88703165.0, + "step": 38370 + }, + { + "epoch": 0.35188411112129825, + "learning_rate": 0.00012962501146052995, + "loss": 0.8312, + "mean_token_accuracy": 0.7476518809795379, + "num_tokens": 88726363.0, + "step": 38380 + }, + { + "epoch": 0.3519757953607775, + "learning_rate": 0.00012960667461263408, + "loss": 0.8249, + "mean_token_accuracy": 0.757578718662262, + "num_tokens": 88750254.0, + "step": 38390 + }, + { + "epoch": 0.3520674796002567, + "learning_rate": 0.00012958833776473825, + "loss": 0.8694, + "mean_token_accuracy": 0.7445272147655487, + "num_tokens": 88774885.0, + "step": 38400 + }, + { + "epoch": 0.35215916383973594, + "learning_rate": 0.0001295700009168424, + "loss": 0.854, + "mean_token_accuracy": 0.7485789954662323, + "num_tokens": 88798150.0, + "step": 38410 + }, + { + "epoch": 0.3522508480792152, + "learning_rate": 0.00012955166406894655, + "loss": 0.8862, + "mean_token_accuracy": 0.7371294021606445, + "num_tokens": 88820933.0, + "step": 38420 + }, + { + "epoch": 0.3523425323186944, + "learning_rate": 0.00012953332722105072, + "loss": 0.8318, + "mean_token_accuracy": 0.7497548401355744, + "num_tokens": 88844233.0, + "step": 38430 + }, + { + "epoch": 0.35243421655817364, + "learning_rate": 0.00012951499037315486, + "loss": 0.8868, + "mean_token_accuracy": 0.744812297821045, + "num_tokens": 88867769.0, + "step": 38440 + }, + { + "epoch": 0.3525259007976529, + "learning_rate": 0.00012949665352525902, + "loss": 0.8434, + "mean_token_accuracy": 0.7472955286502838, + "num_tokens": 88891327.0, + "step": 38450 + }, + { + "epoch": 0.35261758503713214, + "learning_rate": 0.00012947831667736316, + "loss": 0.8129, + "mean_token_accuracy": 0.761379873752594, + "num_tokens": 88914666.0, + "step": 38460 + }, + { + "epoch": 0.35270926927661134, + "learning_rate": 0.00012945997982946733, + "loss": 0.7881, + "mean_token_accuracy": 0.7566261053085327, + "num_tokens": 88936929.0, + "step": 38470 + }, + { + "epoch": 0.3528009535160906, + "learning_rate": 0.00012944164298157147, + "loss": 0.8293, + "mean_token_accuracy": 0.7504927217960358, + "num_tokens": 88960216.0, + "step": 38480 + }, + { + "epoch": 0.35289263775556984, + "learning_rate": 0.00012942330613367563, + "loss": 0.8671, + "mean_token_accuracy": 0.7413956522941589, + "num_tokens": 88983905.0, + "step": 38490 + }, + { + "epoch": 0.35298432199504903, + "learning_rate": 0.0001294049692857798, + "loss": 0.8044, + "mean_token_accuracy": 0.7506045043468476, + "num_tokens": 89007115.0, + "step": 38500 + }, + { + "epoch": 0.3530760062345283, + "learning_rate": 0.00012938663243788393, + "loss": 0.8731, + "mean_token_accuracy": 0.7386382818222046, + "num_tokens": 89030435.0, + "step": 38510 + }, + { + "epoch": 0.35316769047400753, + "learning_rate": 0.0001293682955899881, + "loss": 0.8282, + "mean_token_accuracy": 0.7485121607780456, + "num_tokens": 89053089.0, + "step": 38520 + }, + { + "epoch": 0.35325937471348673, + "learning_rate": 0.00012934995874209224, + "loss": 0.8346, + "mean_token_accuracy": 0.7461729288101197, + "num_tokens": 89075910.0, + "step": 38530 + }, + { + "epoch": 0.353351058952966, + "learning_rate": 0.00012933162189419638, + "loss": 0.8876, + "mean_token_accuracy": 0.7396175980567932, + "num_tokens": 89098818.0, + "step": 38540 + }, + { + "epoch": 0.35344274319244523, + "learning_rate": 0.00012931328504630054, + "loss": 0.8523, + "mean_token_accuracy": 0.7416675686836243, + "num_tokens": 89121559.0, + "step": 38550 + }, + { + "epoch": 0.3535344274319244, + "learning_rate": 0.0001292949481984047, + "loss": 0.8591, + "mean_token_accuracy": 0.7444033920764923, + "num_tokens": 89144569.0, + "step": 38560 + }, + { + "epoch": 0.3536261116714037, + "learning_rate": 0.00012927661135050885, + "loss": 0.8554, + "mean_token_accuracy": 0.7391893625259399, + "num_tokens": 89167488.0, + "step": 38570 + }, + { + "epoch": 0.3537177959108829, + "learning_rate": 0.000129258274502613, + "loss": 0.8595, + "mean_token_accuracy": 0.7431459367275238, + "num_tokens": 89191087.0, + "step": 38580 + }, + { + "epoch": 0.3538094801503622, + "learning_rate": 0.00012923993765471715, + "loss": 0.8943, + "mean_token_accuracy": 0.7316861569881439, + "num_tokens": 89214751.0, + "step": 38590 + }, + { + "epoch": 0.35390116438984137, + "learning_rate": 0.00012922160080682131, + "loss": 0.8157, + "mean_token_accuracy": 0.7547654986381531, + "num_tokens": 89237541.0, + "step": 38600 + }, + { + "epoch": 0.3539928486293206, + "learning_rate": 0.00012920326395892545, + "loss": 0.8402, + "mean_token_accuracy": 0.7504114627838134, + "num_tokens": 89261000.0, + "step": 38610 + }, + { + "epoch": 0.3540845328687999, + "learning_rate": 0.00012918492711102962, + "loss": 0.8761, + "mean_token_accuracy": 0.7410715520381927, + "num_tokens": 89284352.0, + "step": 38620 + }, + { + "epoch": 0.35417621710827907, + "learning_rate": 0.00012916659026313378, + "loss": 0.8579, + "mean_token_accuracy": 0.7444826424121856, + "num_tokens": 89307059.0, + "step": 38630 + }, + { + "epoch": 0.3542679013477583, + "learning_rate": 0.00012914825341523792, + "loss": 0.8555, + "mean_token_accuracy": 0.7434938609600067, + "num_tokens": 89329848.0, + "step": 38640 + }, + { + "epoch": 0.35435958558723757, + "learning_rate": 0.0001291299165673421, + "loss": 0.8214, + "mean_token_accuracy": 0.7490093350410462, + "num_tokens": 89352610.0, + "step": 38650 + }, + { + "epoch": 0.35445126982671676, + "learning_rate": 0.00012911157971944623, + "loss": 0.8965, + "mean_token_accuracy": 0.7354145407676697, + "num_tokens": 89375348.0, + "step": 38660 + }, + { + "epoch": 0.354542954066196, + "learning_rate": 0.0001290932428715504, + "loss": 0.8358, + "mean_token_accuracy": 0.7552769839763641, + "num_tokens": 89398362.0, + "step": 38670 + }, + { + "epoch": 0.35463463830567526, + "learning_rate": 0.00012907490602365453, + "loss": 0.8434, + "mean_token_accuracy": 0.7459128439426422, + "num_tokens": 89421632.0, + "step": 38680 + }, + { + "epoch": 0.3547263225451545, + "learning_rate": 0.0001290565691757587, + "loss": 0.8657, + "mean_token_accuracy": 0.7391178250312805, + "num_tokens": 89444958.0, + "step": 38690 + }, + { + "epoch": 0.3548180067846337, + "learning_rate": 0.00012903823232786286, + "loss": 0.8234, + "mean_token_accuracy": 0.7508709132671356, + "num_tokens": 89468517.0, + "step": 38700 + }, + { + "epoch": 0.35490969102411296, + "learning_rate": 0.000129019895479967, + "loss": 0.8756, + "mean_token_accuracy": 0.7424369275569915, + "num_tokens": 89491319.0, + "step": 38710 + }, + { + "epoch": 0.3550013752635922, + "learning_rate": 0.00012900155863207116, + "loss": 0.859, + "mean_token_accuracy": 0.741323322057724, + "num_tokens": 89513835.0, + "step": 38720 + }, + { + "epoch": 0.3550930595030714, + "learning_rate": 0.0001289832217841753, + "loss": 0.843, + "mean_token_accuracy": 0.7459016382694245, + "num_tokens": 89535923.0, + "step": 38730 + }, + { + "epoch": 0.35518474374255066, + "learning_rate": 0.00012896488493627944, + "loss": 0.8435, + "mean_token_accuracy": 0.7381949424743652, + "num_tokens": 89558352.0, + "step": 38740 + }, + { + "epoch": 0.3552764279820299, + "learning_rate": 0.00012894654808838363, + "loss": 0.8768, + "mean_token_accuracy": 0.7390536606311798, + "num_tokens": 89581438.0, + "step": 38750 + }, + { + "epoch": 0.3553681122215091, + "learning_rate": 0.00012892821124048777, + "loss": 0.8552, + "mean_token_accuracy": 0.7429502248764038, + "num_tokens": 89604468.0, + "step": 38760 + }, + { + "epoch": 0.35545979646098835, + "learning_rate": 0.0001289098743925919, + "loss": 0.8377, + "mean_token_accuracy": 0.7495685458183289, + "num_tokens": 89627744.0, + "step": 38770 + }, + { + "epoch": 0.3555514807004676, + "learning_rate": 0.00012889153754469608, + "loss": 0.7933, + "mean_token_accuracy": 0.760120975971222, + "num_tokens": 89650348.0, + "step": 38780 + }, + { + "epoch": 0.3556431649399468, + "learning_rate": 0.00012887320069680021, + "loss": 0.8458, + "mean_token_accuracy": 0.7500900089740753, + "num_tokens": 89672996.0, + "step": 38790 + }, + { + "epoch": 0.35573484917942605, + "learning_rate": 0.00012885486384890438, + "loss": 0.8472, + "mean_token_accuracy": 0.7481849253177643, + "num_tokens": 89695909.0, + "step": 38800 + }, + { + "epoch": 0.3558265334189053, + "learning_rate": 0.00012883652700100852, + "loss": 0.8369, + "mean_token_accuracy": 0.7435585975646972, + "num_tokens": 89719193.0, + "step": 38810 + }, + { + "epoch": 0.35591821765838455, + "learning_rate": 0.00012881819015311268, + "loss": 0.8693, + "mean_token_accuracy": 0.7380140542984008, + "num_tokens": 89742571.0, + "step": 38820 + }, + { + "epoch": 0.35600990189786375, + "learning_rate": 0.00012879985330521685, + "loss": 0.8536, + "mean_token_accuracy": 0.7438553154468537, + "num_tokens": 89765541.0, + "step": 38830 + }, + { + "epoch": 0.356101586137343, + "learning_rate": 0.000128781516457321, + "loss": 0.8287, + "mean_token_accuracy": 0.7518167436122895, + "num_tokens": 89788947.0, + "step": 38840 + }, + { + "epoch": 0.35619327037682225, + "learning_rate": 0.00012876317960942515, + "loss": 0.8549, + "mean_token_accuracy": 0.7409891963005066, + "num_tokens": 89812581.0, + "step": 38850 + }, + { + "epoch": 0.35628495461630144, + "learning_rate": 0.0001287448427615293, + "loss": 0.8367, + "mean_token_accuracy": 0.7552560925483703, + "num_tokens": 89835979.0, + "step": 38860 + }, + { + "epoch": 0.3563766388557807, + "learning_rate": 0.00012872650591363346, + "loss": 0.8899, + "mean_token_accuracy": 0.738469660282135, + "num_tokens": 89859430.0, + "step": 38870 + }, + { + "epoch": 0.35646832309525994, + "learning_rate": 0.00012870816906573762, + "loss": 0.8423, + "mean_token_accuracy": 0.7447143912315368, + "num_tokens": 89881839.0, + "step": 38880 + }, + { + "epoch": 0.35656000733473914, + "learning_rate": 0.00012868983221784176, + "loss": 0.8659, + "mean_token_accuracy": 0.7414678514003754, + "num_tokens": 89905307.0, + "step": 38890 + }, + { + "epoch": 0.3566516915742184, + "learning_rate": 0.00012867149536994592, + "loss": 0.8785, + "mean_token_accuracy": 0.7430894374847412, + "num_tokens": 89927163.0, + "step": 38900 + }, + { + "epoch": 0.35674337581369764, + "learning_rate": 0.00012865315852205006, + "loss": 0.8438, + "mean_token_accuracy": 0.7401298344135284, + "num_tokens": 89949534.0, + "step": 38910 + }, + { + "epoch": 0.35683506005317683, + "learning_rate": 0.00012863482167415423, + "loss": 0.8889, + "mean_token_accuracy": 0.732297396659851, + "num_tokens": 89972443.0, + "step": 38920 + }, + { + "epoch": 0.3569267442926561, + "learning_rate": 0.00012861648482625837, + "loss": 0.8917, + "mean_token_accuracy": 0.7350900173187256, + "num_tokens": 89996057.0, + "step": 38930 + }, + { + "epoch": 0.35701842853213533, + "learning_rate": 0.0001285981479783625, + "loss": 0.8232, + "mean_token_accuracy": 0.75139200091362, + "num_tokens": 90019554.0, + "step": 38940 + }, + { + "epoch": 0.3571101127716146, + "learning_rate": 0.0001285798111304667, + "loss": 0.8193, + "mean_token_accuracy": 0.7521109402179718, + "num_tokens": 90042731.0, + "step": 38950 + }, + { + "epoch": 0.3572017970110938, + "learning_rate": 0.00012856147428257084, + "loss": 0.8265, + "mean_token_accuracy": 0.7502789199352264, + "num_tokens": 90066579.0, + "step": 38960 + }, + { + "epoch": 0.35729348125057303, + "learning_rate": 0.00012854313743467497, + "loss": 0.8414, + "mean_token_accuracy": 0.7500373899936676, + "num_tokens": 90089836.0, + "step": 38970 + }, + { + "epoch": 0.3573851654900523, + "learning_rate": 0.00012852480058677914, + "loss": 0.8224, + "mean_token_accuracy": 0.7452053368091583, + "num_tokens": 90113076.0, + "step": 38980 + }, + { + "epoch": 0.3574768497295315, + "learning_rate": 0.00012850646373888328, + "loss": 0.8497, + "mean_token_accuracy": 0.7411587238311768, + "num_tokens": 90135710.0, + "step": 38990 + }, + { + "epoch": 0.3575685339690107, + "learning_rate": 0.00012848812689098744, + "loss": 0.8635, + "mean_token_accuracy": 0.746865326166153, + "num_tokens": 90158250.0, + "step": 39000 + }, + { + "epoch": 0.35766021820849, + "learning_rate": 0.0001284697900430916, + "loss": 0.8973, + "mean_token_accuracy": 0.7384992718696595, + "num_tokens": 90180860.0, + "step": 39010 + }, + { + "epoch": 0.3577519024479692, + "learning_rate": 0.00012845145319519575, + "loss": 0.8197, + "mean_token_accuracy": 0.7542255163192749, + "num_tokens": 90205006.0, + "step": 39020 + }, + { + "epoch": 0.3578435866874484, + "learning_rate": 0.0001284331163472999, + "loss": 0.8778, + "mean_token_accuracy": 0.7382643461227417, + "num_tokens": 90228296.0, + "step": 39030 + }, + { + "epoch": 0.3579352709269277, + "learning_rate": 0.00012841477949940405, + "loss": 0.8675, + "mean_token_accuracy": 0.7422235667705536, + "num_tokens": 90251008.0, + "step": 39040 + }, + { + "epoch": 0.35802695516640687, + "learning_rate": 0.00012839644265150822, + "loss": 0.8676, + "mean_token_accuracy": 0.7396080613136291, + "num_tokens": 90273592.0, + "step": 39050 + }, + { + "epoch": 0.3581186394058861, + "learning_rate": 0.00012837810580361235, + "loss": 0.8192, + "mean_token_accuracy": 0.7484216511249542, + "num_tokens": 90295922.0, + "step": 39060 + }, + { + "epoch": 0.35821032364536537, + "learning_rate": 0.00012835976895571652, + "loss": 0.8485, + "mean_token_accuracy": 0.7439599335193634, + "num_tokens": 90319196.0, + "step": 39070 + }, + { + "epoch": 0.3583020078848446, + "learning_rate": 0.00012834143210782069, + "loss": 0.8107, + "mean_token_accuracy": 0.7551554799079895, + "num_tokens": 90342472.0, + "step": 39080 + }, + { + "epoch": 0.3583936921243238, + "learning_rate": 0.00012832309525992482, + "loss": 0.8435, + "mean_token_accuracy": 0.7491034090518951, + "num_tokens": 90365535.0, + "step": 39090 + }, + { + "epoch": 0.35848537636380307, + "learning_rate": 0.000128304758412029, + "loss": 0.8645, + "mean_token_accuracy": 0.7451542317867279, + "num_tokens": 90389256.0, + "step": 39100 + }, + { + "epoch": 0.3585770606032823, + "learning_rate": 0.00012828642156413313, + "loss": 0.8498, + "mean_token_accuracy": 0.7479837834835052, + "num_tokens": 90412471.0, + "step": 39110 + }, + { + "epoch": 0.3586687448427615, + "learning_rate": 0.0001282680847162373, + "loss": 0.8556, + "mean_token_accuracy": 0.7468072712421417, + "num_tokens": 90435449.0, + "step": 39120 + }, + { + "epoch": 0.35876042908224076, + "learning_rate": 0.00012824974786834143, + "loss": 0.8422, + "mean_token_accuracy": 0.7487893998622894, + "num_tokens": 90458550.0, + "step": 39130 + }, + { + "epoch": 0.35885211332172, + "learning_rate": 0.0001282314110204456, + "loss": 0.8225, + "mean_token_accuracy": 0.7485275208950043, + "num_tokens": 90481708.0, + "step": 39140 + }, + { + "epoch": 0.3589437975611992, + "learning_rate": 0.00012821307417254976, + "loss": 0.8724, + "mean_token_accuracy": 0.7405048310756683, + "num_tokens": 90504383.0, + "step": 39150 + }, + { + "epoch": 0.35903548180067846, + "learning_rate": 0.0001281947373246539, + "loss": 0.8815, + "mean_token_accuracy": 0.7343416690826416, + "num_tokens": 90526789.0, + "step": 39160 + }, + { + "epoch": 0.3591271660401577, + "learning_rate": 0.00012817640047675804, + "loss": 0.8402, + "mean_token_accuracy": 0.7461209952831268, + "num_tokens": 90549569.0, + "step": 39170 + }, + { + "epoch": 0.3592188502796369, + "learning_rate": 0.0001281580636288622, + "loss": 0.8485, + "mean_token_accuracy": 0.7476036727428437, + "num_tokens": 90572528.0, + "step": 39180 + }, + { + "epoch": 0.35931053451911615, + "learning_rate": 0.00012813972678096634, + "loss": 0.8527, + "mean_token_accuracy": 0.7453954100608826, + "num_tokens": 90595236.0, + "step": 39190 + }, + { + "epoch": 0.3594022187585954, + "learning_rate": 0.0001281213899330705, + "loss": 0.8443, + "mean_token_accuracy": 0.7483029246330262, + "num_tokens": 90618319.0, + "step": 39200 + }, + { + "epoch": 0.35949390299807465, + "learning_rate": 0.00012810305308517467, + "loss": 0.8381, + "mean_token_accuracy": 0.7419435441493988, + "num_tokens": 90642358.0, + "step": 39210 + }, + { + "epoch": 0.35958558723755385, + "learning_rate": 0.0001280847162372788, + "loss": 0.824, + "mean_token_accuracy": 0.7481161892414093, + "num_tokens": 90665259.0, + "step": 39220 + }, + { + "epoch": 0.3596772714770331, + "learning_rate": 0.00012806637938938298, + "loss": 0.8651, + "mean_token_accuracy": 0.7428594410419465, + "num_tokens": 90688499.0, + "step": 39230 + }, + { + "epoch": 0.35976895571651235, + "learning_rate": 0.00012804804254148712, + "loss": 0.8357, + "mean_token_accuracy": 0.7452928125858307, + "num_tokens": 90711019.0, + "step": 39240 + }, + { + "epoch": 0.35986063995599155, + "learning_rate": 0.00012802970569359128, + "loss": 0.8387, + "mean_token_accuracy": 0.7483808994293213, + "num_tokens": 90734314.0, + "step": 39250 + }, + { + "epoch": 0.3599523241954708, + "learning_rate": 0.00012801136884569542, + "loss": 0.8577, + "mean_token_accuracy": 0.7443465471267701, + "num_tokens": 90756865.0, + "step": 39260 + }, + { + "epoch": 0.36004400843495005, + "learning_rate": 0.00012799303199779958, + "loss": 0.8498, + "mean_token_accuracy": 0.7470487833023072, + "num_tokens": 90779856.0, + "step": 39270 + }, + { + "epoch": 0.36013569267442924, + "learning_rate": 0.00012797469514990375, + "loss": 0.8442, + "mean_token_accuracy": 0.745301365852356, + "num_tokens": 90802740.0, + "step": 39280 + }, + { + "epoch": 0.3602273769139085, + "learning_rate": 0.0001279563583020079, + "loss": 0.8645, + "mean_token_accuracy": 0.7416181266307831, + "num_tokens": 90825374.0, + "step": 39290 + }, + { + "epoch": 0.36031906115338774, + "learning_rate": 0.00012793802145411205, + "loss": 0.8394, + "mean_token_accuracy": 0.7457209348678588, + "num_tokens": 90848466.0, + "step": 39300 + }, + { + "epoch": 0.360410745392867, + "learning_rate": 0.0001279196846062162, + "loss": 0.8263, + "mean_token_accuracy": 0.7445708155632019, + "num_tokens": 90871587.0, + "step": 39310 + }, + { + "epoch": 0.3605024296323462, + "learning_rate": 0.00012790134775832036, + "loss": 0.8219, + "mean_token_accuracy": 0.7543377220630646, + "num_tokens": 90894651.0, + "step": 39320 + }, + { + "epoch": 0.36059411387182544, + "learning_rate": 0.0001278830109104245, + "loss": 0.8443, + "mean_token_accuracy": 0.7494737327098846, + "num_tokens": 90916604.0, + "step": 39330 + }, + { + "epoch": 0.3606857981113047, + "learning_rate": 0.00012786467406252866, + "loss": 0.8429, + "mean_token_accuracy": 0.7450239300727844, + "num_tokens": 90940320.0, + "step": 39340 + }, + { + "epoch": 0.3607774823507839, + "learning_rate": 0.00012784633721463283, + "loss": 0.8433, + "mean_token_accuracy": 0.7413978159427643, + "num_tokens": 90963151.0, + "step": 39350 + }, + { + "epoch": 0.36086916659026314, + "learning_rate": 0.00012782800036673697, + "loss": 0.8646, + "mean_token_accuracy": 0.7412473142147065, + "num_tokens": 90985936.0, + "step": 39360 + }, + { + "epoch": 0.3609608508297424, + "learning_rate": 0.0001278096635188411, + "loss": 0.877, + "mean_token_accuracy": 0.7413740694522858, + "num_tokens": 91009272.0, + "step": 39370 + }, + { + "epoch": 0.3610525350692216, + "learning_rate": 0.00012779132667094527, + "loss": 0.8859, + "mean_token_accuracy": 0.7399205446243287, + "num_tokens": 91031775.0, + "step": 39380 + }, + { + "epoch": 0.36114421930870083, + "learning_rate": 0.0001277729898230494, + "loss": 0.8553, + "mean_token_accuracy": 0.7363078713417053, + "num_tokens": 91054082.0, + "step": 39390 + }, + { + "epoch": 0.3612359035481801, + "learning_rate": 0.0001277546529751536, + "loss": 0.8494, + "mean_token_accuracy": 0.7414499998092652, + "num_tokens": 91077776.0, + "step": 39400 + }, + { + "epoch": 0.3613275877876593, + "learning_rate": 0.00012773631612725774, + "loss": 0.8359, + "mean_token_accuracy": 0.7497224688529969, + "num_tokens": 91100582.0, + "step": 39410 + }, + { + "epoch": 0.3614192720271385, + "learning_rate": 0.00012771797927936188, + "loss": 0.8398, + "mean_token_accuracy": 0.7529937386512756, + "num_tokens": 91123815.0, + "step": 39420 + }, + { + "epoch": 0.3615109562666178, + "learning_rate": 0.00012769964243146604, + "loss": 0.8393, + "mean_token_accuracy": 0.7540438890457153, + "num_tokens": 91146444.0, + "step": 39430 + }, + { + "epoch": 0.36160264050609703, + "learning_rate": 0.00012768130558357018, + "loss": 0.8569, + "mean_token_accuracy": 0.7441222786903381, + "num_tokens": 91168597.0, + "step": 39440 + }, + { + "epoch": 0.3616943247455762, + "learning_rate": 0.00012766296873567435, + "loss": 0.8169, + "mean_token_accuracy": 0.7493405520915986, + "num_tokens": 91192109.0, + "step": 39450 + }, + { + "epoch": 0.3617860089850555, + "learning_rate": 0.00012764463188777848, + "loss": 0.9045, + "mean_token_accuracy": 0.7368192732334137, + "num_tokens": 91215439.0, + "step": 39460 + }, + { + "epoch": 0.3618776932245347, + "learning_rate": 0.00012762629503988265, + "loss": 0.8497, + "mean_token_accuracy": 0.7431175529956817, + "num_tokens": 91238840.0, + "step": 39470 + }, + { + "epoch": 0.3619693774640139, + "learning_rate": 0.00012760795819198681, + "loss": 0.8498, + "mean_token_accuracy": 0.7466048240661621, + "num_tokens": 91261077.0, + "step": 39480 + }, + { + "epoch": 0.36206106170349317, + "learning_rate": 0.00012758962134409095, + "loss": 0.8498, + "mean_token_accuracy": 0.7444063425064087, + "num_tokens": 91283721.0, + "step": 39490 + }, + { + "epoch": 0.3621527459429724, + "learning_rate": 0.00012757128449619512, + "loss": 0.8679, + "mean_token_accuracy": 0.7448558211326599, + "num_tokens": 91306497.0, + "step": 39500 + }, + { + "epoch": 0.3622444301824516, + "learning_rate": 0.00012755294764829926, + "loss": 0.8287, + "mean_token_accuracy": 0.7477375030517578, + "num_tokens": 91329031.0, + "step": 39510 + }, + { + "epoch": 0.36233611442193087, + "learning_rate": 0.00012753461080040342, + "loss": 0.852, + "mean_token_accuracy": 0.741021329164505, + "num_tokens": 91352555.0, + "step": 39520 + }, + { + "epoch": 0.3624277986614101, + "learning_rate": 0.0001275162739525076, + "loss": 0.7893, + "mean_token_accuracy": 0.7620260953903198, + "num_tokens": 91375262.0, + "step": 39530 + }, + { + "epoch": 0.3625194829008893, + "learning_rate": 0.00012749793710461173, + "loss": 0.8846, + "mean_token_accuracy": 0.7371660232543945, + "num_tokens": 91398662.0, + "step": 39540 + }, + { + "epoch": 0.36261116714036856, + "learning_rate": 0.0001274796002567159, + "loss": 0.8849, + "mean_token_accuracy": 0.7396804332733155, + "num_tokens": 91422616.0, + "step": 39550 + }, + { + "epoch": 0.3627028513798478, + "learning_rate": 0.00012746126340882003, + "loss": 0.8744, + "mean_token_accuracy": 0.7417828977108002, + "num_tokens": 91445879.0, + "step": 39560 + }, + { + "epoch": 0.36279453561932706, + "learning_rate": 0.00012744292656092417, + "loss": 0.8211, + "mean_token_accuracy": 0.7551993131637573, + "num_tokens": 91469407.0, + "step": 39570 + }, + { + "epoch": 0.36288621985880626, + "learning_rate": 0.00012742458971302833, + "loss": 0.8545, + "mean_token_accuracy": 0.7422672986984253, + "num_tokens": 91493572.0, + "step": 39580 + }, + { + "epoch": 0.3629779040982855, + "learning_rate": 0.00012740625286513247, + "loss": 0.8858, + "mean_token_accuracy": 0.7383472084999084, + "num_tokens": 91517109.0, + "step": 39590 + }, + { + "epoch": 0.36306958833776476, + "learning_rate": 0.00012738791601723666, + "loss": 0.846, + "mean_token_accuracy": 0.7447839200496673, + "num_tokens": 91540272.0, + "step": 39600 + }, + { + "epoch": 0.36316127257724395, + "learning_rate": 0.0001273695791693408, + "loss": 0.837, + "mean_token_accuracy": 0.750486308336258, + "num_tokens": 91563517.0, + "step": 39610 + }, + { + "epoch": 0.3632529568167232, + "learning_rate": 0.00012735124232144494, + "loss": 0.8292, + "mean_token_accuracy": 0.7488204300403595, + "num_tokens": 91586299.0, + "step": 39620 + }, + { + "epoch": 0.36334464105620246, + "learning_rate": 0.0001273329054735491, + "loss": 0.8614, + "mean_token_accuracy": 0.7387410640716553, + "num_tokens": 91609314.0, + "step": 39630 + }, + { + "epoch": 0.36343632529568165, + "learning_rate": 0.00012731456862565324, + "loss": 0.8755, + "mean_token_accuracy": 0.7395784020423889, + "num_tokens": 91631534.0, + "step": 39640 + }, + { + "epoch": 0.3635280095351609, + "learning_rate": 0.0001272962317777574, + "loss": 0.8138, + "mean_token_accuracy": 0.7593177497386933, + "num_tokens": 91654197.0, + "step": 39650 + }, + { + "epoch": 0.36361969377464015, + "learning_rate": 0.00012727789492986155, + "loss": 0.901, + "mean_token_accuracy": 0.7381822168827057, + "num_tokens": 91677741.0, + "step": 39660 + }, + { + "epoch": 0.36371137801411935, + "learning_rate": 0.00012725955808196571, + "loss": 0.8208, + "mean_token_accuracy": 0.7579244554042817, + "num_tokens": 91700968.0, + "step": 39670 + }, + { + "epoch": 0.3638030622535986, + "learning_rate": 0.00012724122123406988, + "loss": 0.8199, + "mean_token_accuracy": 0.7514577746391297, + "num_tokens": 91723811.0, + "step": 39680 + }, + { + "epoch": 0.36389474649307785, + "learning_rate": 0.00012722288438617402, + "loss": 0.849, + "mean_token_accuracy": 0.7445736348628997, + "num_tokens": 91747070.0, + "step": 39690 + }, + { + "epoch": 0.3639864307325571, + "learning_rate": 0.00012720454753827818, + "loss": 0.8652, + "mean_token_accuracy": 0.7425487399101257, + "num_tokens": 91770766.0, + "step": 39700 + }, + { + "epoch": 0.3640781149720363, + "learning_rate": 0.00012718621069038232, + "loss": 0.8629, + "mean_token_accuracy": 0.7428417444229126, + "num_tokens": 91793856.0, + "step": 39710 + }, + { + "epoch": 0.36416979921151554, + "learning_rate": 0.0001271678738424865, + "loss": 0.8573, + "mean_token_accuracy": 0.7450142085552216, + "num_tokens": 91816416.0, + "step": 39720 + }, + { + "epoch": 0.3642614834509948, + "learning_rate": 0.00012714953699459065, + "loss": 0.8599, + "mean_token_accuracy": 0.7451660454273223, + "num_tokens": 91839904.0, + "step": 39730 + }, + { + "epoch": 0.364353167690474, + "learning_rate": 0.0001271312001466948, + "loss": 0.8252, + "mean_token_accuracy": 0.7544918477535247, + "num_tokens": 91862889.0, + "step": 39740 + }, + { + "epoch": 0.36444485192995324, + "learning_rate": 0.00012711286329879896, + "loss": 0.8108, + "mean_token_accuracy": 0.7567556619644165, + "num_tokens": 91886440.0, + "step": 39750 + }, + { + "epoch": 0.3645365361694325, + "learning_rate": 0.0001270945264509031, + "loss": 0.8637, + "mean_token_accuracy": 0.741011118888855, + "num_tokens": 91908793.0, + "step": 39760 + }, + { + "epoch": 0.3646282204089117, + "learning_rate": 0.00012707618960300723, + "loss": 0.8299, + "mean_token_accuracy": 0.7522927403450013, + "num_tokens": 91931469.0, + "step": 39770 + }, + { + "epoch": 0.36471990464839094, + "learning_rate": 0.0001270578527551114, + "loss": 0.8267, + "mean_token_accuracy": 0.7494844019412994, + "num_tokens": 91955670.0, + "step": 39780 + }, + { + "epoch": 0.3648115888878702, + "learning_rate": 0.00012703951590721554, + "loss": 0.8347, + "mean_token_accuracy": 0.7501931846141815, + "num_tokens": 91977964.0, + "step": 39790 + }, + { + "epoch": 0.3649032731273494, + "learning_rate": 0.00012702117905931973, + "loss": 0.8576, + "mean_token_accuracy": 0.7422442376613617, + "num_tokens": 92000707.0, + "step": 39800 + }, + { + "epoch": 0.36499495736682863, + "learning_rate": 0.00012700284221142387, + "loss": 0.8159, + "mean_token_accuracy": 0.7515161991119385, + "num_tokens": 92023331.0, + "step": 39810 + }, + { + "epoch": 0.3650866416063079, + "learning_rate": 0.000126984505363528, + "loss": 0.8625, + "mean_token_accuracy": 0.7397204816341401, + "num_tokens": 92046328.0, + "step": 39820 + }, + { + "epoch": 0.36517832584578713, + "learning_rate": 0.00012696616851563217, + "loss": 0.8626, + "mean_token_accuracy": 0.7454255521297455, + "num_tokens": 92069562.0, + "step": 39830 + }, + { + "epoch": 0.36527001008526633, + "learning_rate": 0.0001269478316677363, + "loss": 0.8456, + "mean_token_accuracy": 0.747641122341156, + "num_tokens": 92091851.0, + "step": 39840 + }, + { + "epoch": 0.3653616943247456, + "learning_rate": 0.00012692949481984047, + "loss": 0.8453, + "mean_token_accuracy": 0.7518446266651153, + "num_tokens": 92115268.0, + "step": 39850 + }, + { + "epoch": 0.36545337856422483, + "learning_rate": 0.00012691115797194464, + "loss": 0.8191, + "mean_token_accuracy": 0.7559412837028503, + "num_tokens": 92138997.0, + "step": 39860 + }, + { + "epoch": 0.365545062803704, + "learning_rate": 0.00012689282112404878, + "loss": 0.8185, + "mean_token_accuracy": 0.7551422715187073, + "num_tokens": 92162308.0, + "step": 39870 + }, + { + "epoch": 0.3656367470431833, + "learning_rate": 0.00012687448427615294, + "loss": 0.8545, + "mean_token_accuracy": 0.742394644021988, + "num_tokens": 92186312.0, + "step": 39880 + }, + { + "epoch": 0.3657284312826625, + "learning_rate": 0.00012685614742825708, + "loss": 0.8675, + "mean_token_accuracy": 0.743462860584259, + "num_tokens": 92209528.0, + "step": 39890 + }, + { + "epoch": 0.3658201155221417, + "learning_rate": 0.00012683781058036125, + "loss": 0.8764, + "mean_token_accuracy": 0.7435184717178345, + "num_tokens": 92232266.0, + "step": 39900 + }, + { + "epoch": 0.36591179976162097, + "learning_rate": 0.00012681947373246539, + "loss": 0.8281, + "mean_token_accuracy": 0.7465691208839417, + "num_tokens": 92255286.0, + "step": 39910 + }, + { + "epoch": 0.3660034840011002, + "learning_rate": 0.00012680113688456955, + "loss": 0.846, + "mean_token_accuracy": 0.7478818774223328, + "num_tokens": 92278139.0, + "step": 39920 + }, + { + "epoch": 0.36609516824057947, + "learning_rate": 0.00012678280003667372, + "loss": 0.8633, + "mean_token_accuracy": 0.7438245713710785, + "num_tokens": 92301488.0, + "step": 39930 + }, + { + "epoch": 0.36618685248005867, + "learning_rate": 0.00012676446318877785, + "loss": 0.8329, + "mean_token_accuracy": 0.7494479298591614, + "num_tokens": 92324312.0, + "step": 39940 + }, + { + "epoch": 0.3662785367195379, + "learning_rate": 0.00012674612634088202, + "loss": 0.856, + "mean_token_accuracy": 0.7483045279979705, + "num_tokens": 92347224.0, + "step": 39950 + }, + { + "epoch": 0.36637022095901717, + "learning_rate": 0.00012672778949298616, + "loss": 0.8827, + "mean_token_accuracy": 0.7397355735301971, + "num_tokens": 92369762.0, + "step": 39960 + }, + { + "epoch": 0.36646190519849636, + "learning_rate": 0.0001267094526450903, + "loss": 0.838, + "mean_token_accuracy": 0.7478506326675415, + "num_tokens": 92393210.0, + "step": 39970 + }, + { + "epoch": 0.3665535894379756, + "learning_rate": 0.00012669111579719446, + "loss": 0.8243, + "mean_token_accuracy": 0.7567574977874756, + "num_tokens": 92416100.0, + "step": 39980 + }, + { + "epoch": 0.36664527367745486, + "learning_rate": 0.00012667277894929863, + "loss": 0.8177, + "mean_token_accuracy": 0.7546796023845672, + "num_tokens": 92439552.0, + "step": 39990 + }, + { + "epoch": 0.36673695791693406, + "learning_rate": 0.0001266544421014028, + "loss": 0.8345, + "mean_token_accuracy": 0.7529680073261261, + "num_tokens": 92462410.0, + "step": 40000 + }, + { + "epoch": 0.3668286421564133, + "learning_rate": 0.00012663610525350693, + "loss": 0.846, + "mean_token_accuracy": 0.7406797587871552, + "num_tokens": 92485957.0, + "step": 40010 + }, + { + "epoch": 0.36692032639589256, + "learning_rate": 0.00012661776840561107, + "loss": 0.8346, + "mean_token_accuracy": 0.7488115429878235, + "num_tokens": 92508695.0, + "step": 40020 + }, + { + "epoch": 0.36701201063537175, + "learning_rate": 0.00012659943155771524, + "loss": 0.8482, + "mean_token_accuracy": 0.7431809842586518, + "num_tokens": 92532395.0, + "step": 40030 + }, + { + "epoch": 0.367103694874851, + "learning_rate": 0.00012658109470981937, + "loss": 0.8305, + "mean_token_accuracy": 0.7561107218265534, + "num_tokens": 92555286.0, + "step": 40040 + }, + { + "epoch": 0.36719537911433026, + "learning_rate": 0.00012656275786192354, + "loss": 0.8408, + "mean_token_accuracy": 0.7459770798683166, + "num_tokens": 92577634.0, + "step": 40050 + }, + { + "epoch": 0.3672870633538095, + "learning_rate": 0.0001265444210140277, + "loss": 0.8849, + "mean_token_accuracy": 0.7432604789733886, + "num_tokens": 92600191.0, + "step": 40060 + }, + { + "epoch": 0.3673787475932887, + "learning_rate": 0.00012652608416613184, + "loss": 0.8035, + "mean_token_accuracy": 0.7561726629734039, + "num_tokens": 92623965.0, + "step": 40070 + }, + { + "epoch": 0.36747043183276795, + "learning_rate": 0.000126507747318236, + "loss": 0.8311, + "mean_token_accuracy": 0.7523778915405274, + "num_tokens": 92647741.0, + "step": 40080 + }, + { + "epoch": 0.3675621160722472, + "learning_rate": 0.00012648941047034015, + "loss": 0.821, + "mean_token_accuracy": 0.7464438676834106, + "num_tokens": 92670825.0, + "step": 40090 + }, + { + "epoch": 0.3676538003117264, + "learning_rate": 0.0001264710736224443, + "loss": 0.8582, + "mean_token_accuracy": 0.7455631375312806, + "num_tokens": 92693320.0, + "step": 40100 + }, + { + "epoch": 0.36774548455120565, + "learning_rate": 0.00012645273677454845, + "loss": 0.7979, + "mean_token_accuracy": 0.7619030833244324, + "num_tokens": 92715172.0, + "step": 40110 + }, + { + "epoch": 0.3678371687906849, + "learning_rate": 0.00012643439992665262, + "loss": 0.8307, + "mean_token_accuracy": 0.7564894676208496, + "num_tokens": 92738453.0, + "step": 40120 + }, + { + "epoch": 0.3679288530301641, + "learning_rate": 0.00012641606307875678, + "loss": 0.8251, + "mean_token_accuracy": 0.7496735274791717, + "num_tokens": 92761941.0, + "step": 40130 + }, + { + "epoch": 0.36802053726964334, + "learning_rate": 0.00012639772623086092, + "loss": 0.8662, + "mean_token_accuracy": 0.7428528904914856, + "num_tokens": 92784551.0, + "step": 40140 + }, + { + "epoch": 0.3681122215091226, + "learning_rate": 0.00012637938938296508, + "loss": 0.8338, + "mean_token_accuracy": 0.7540151894092559, + "num_tokens": 92806983.0, + "step": 40150 + }, + { + "epoch": 0.3682039057486018, + "learning_rate": 0.00012636105253506922, + "loss": 0.8424, + "mean_token_accuracy": 0.7459520876407624, + "num_tokens": 92829925.0, + "step": 40160 + }, + { + "epoch": 0.36829558998808104, + "learning_rate": 0.00012634271568717336, + "loss": 0.8298, + "mean_token_accuracy": 0.7497051417827606, + "num_tokens": 92853052.0, + "step": 40170 + }, + { + "epoch": 0.3683872742275603, + "learning_rate": 0.00012632437883927753, + "loss": 0.8425, + "mean_token_accuracy": 0.7553964674472808, + "num_tokens": 92875672.0, + "step": 40180 + }, + { + "epoch": 0.36847895846703954, + "learning_rate": 0.0001263060419913817, + "loss": 0.8324, + "mean_token_accuracy": 0.7483945846557617, + "num_tokens": 92898021.0, + "step": 40190 + }, + { + "epoch": 0.36857064270651874, + "learning_rate": 0.00012628770514348586, + "loss": 0.7824, + "mean_token_accuracy": 0.7633194088935852, + "num_tokens": 92921031.0, + "step": 40200 + }, + { + "epoch": 0.368662326945998, + "learning_rate": 0.00012626936829559, + "loss": 0.8493, + "mean_token_accuracy": 0.7487386226654053, + "num_tokens": 92943211.0, + "step": 40210 + }, + { + "epoch": 0.36875401118547724, + "learning_rate": 0.00012625103144769413, + "loss": 0.8353, + "mean_token_accuracy": 0.7439074158668518, + "num_tokens": 92965929.0, + "step": 40220 + }, + { + "epoch": 0.36884569542495643, + "learning_rate": 0.0001262326945997983, + "loss": 0.8342, + "mean_token_accuracy": 0.7512854933738708, + "num_tokens": 92989508.0, + "step": 40230 + }, + { + "epoch": 0.3689373796644357, + "learning_rate": 0.00012621435775190244, + "loss": 0.8629, + "mean_token_accuracy": 0.7368911981582642, + "num_tokens": 93012147.0, + "step": 40240 + }, + { + "epoch": 0.36902906390391493, + "learning_rate": 0.00012619602090400663, + "loss": 0.8342, + "mean_token_accuracy": 0.7457172989845275, + "num_tokens": 93035091.0, + "step": 40250 + }, + { + "epoch": 0.36912074814339413, + "learning_rate": 0.00012617768405611077, + "loss": 0.8514, + "mean_token_accuracy": 0.7521363794803619, + "num_tokens": 93058530.0, + "step": 40260 + }, + { + "epoch": 0.3692124323828734, + "learning_rate": 0.0001261593472082149, + "loss": 0.813, + "mean_token_accuracy": 0.7531933188438416, + "num_tokens": 93081509.0, + "step": 40270 + }, + { + "epoch": 0.36930411662235263, + "learning_rate": 0.00012614101036031907, + "loss": 0.8282, + "mean_token_accuracy": 0.7440933346748352, + "num_tokens": 93103968.0, + "step": 40280 + }, + { + "epoch": 0.3693958008618318, + "learning_rate": 0.0001261226735124232, + "loss": 0.8138, + "mean_token_accuracy": 0.753024297952652, + "num_tokens": 93126975.0, + "step": 40290 + }, + { + "epoch": 0.3694874851013111, + "learning_rate": 0.00012610433666452738, + "loss": 0.8427, + "mean_token_accuracy": 0.7481602966785431, + "num_tokens": 93150114.0, + "step": 40300 + }, + { + "epoch": 0.3695791693407903, + "learning_rate": 0.00012608599981663151, + "loss": 0.9202, + "mean_token_accuracy": 0.7269593954086304, + "num_tokens": 93173992.0, + "step": 40310 + }, + { + "epoch": 0.3696708535802696, + "learning_rate": 0.00012606766296873568, + "loss": 0.8513, + "mean_token_accuracy": 0.7426384091377258, + "num_tokens": 93197403.0, + "step": 40320 + }, + { + "epoch": 0.36976253781974877, + "learning_rate": 0.00012604932612083985, + "loss": 0.859, + "mean_token_accuracy": 0.7421603322029113, + "num_tokens": 93220655.0, + "step": 40330 + }, + { + "epoch": 0.369854222059228, + "learning_rate": 0.00012603098927294398, + "loss": 0.8047, + "mean_token_accuracy": 0.7526649475097656, + "num_tokens": 93243287.0, + "step": 40340 + }, + { + "epoch": 0.36994590629870727, + "learning_rate": 0.00012601265242504815, + "loss": 0.8612, + "mean_token_accuracy": 0.747111189365387, + "num_tokens": 93266655.0, + "step": 40350 + }, + { + "epoch": 0.37003759053818647, + "learning_rate": 0.0001259943155771523, + "loss": 0.862, + "mean_token_accuracy": 0.7481015443801879, + "num_tokens": 93289581.0, + "step": 40360 + }, + { + "epoch": 0.3701292747776657, + "learning_rate": 0.00012597597872925643, + "loss": 0.8106, + "mean_token_accuracy": 0.7533900260925293, + "num_tokens": 93312663.0, + "step": 40370 + }, + { + "epoch": 0.37022095901714497, + "learning_rate": 0.00012595764188136062, + "loss": 0.8559, + "mean_token_accuracy": 0.7490554809570312, + "num_tokens": 93335413.0, + "step": 40380 + }, + { + "epoch": 0.37031264325662416, + "learning_rate": 0.00012593930503346476, + "loss": 0.8592, + "mean_token_accuracy": 0.7416788399219513, + "num_tokens": 93358953.0, + "step": 40390 + }, + { + "epoch": 0.3704043274961034, + "learning_rate": 0.00012592096818556892, + "loss": 0.833, + "mean_token_accuracy": 0.744015908241272, + "num_tokens": 93382002.0, + "step": 40400 + }, + { + "epoch": 0.37049601173558266, + "learning_rate": 0.00012590263133767306, + "loss": 0.8255, + "mean_token_accuracy": 0.75286785364151, + "num_tokens": 93405306.0, + "step": 40410 + }, + { + "epoch": 0.37058769597506186, + "learning_rate": 0.0001258842944897772, + "loss": 0.8513, + "mean_token_accuracy": 0.7488247215747833, + "num_tokens": 93429457.0, + "step": 40420 + }, + { + "epoch": 0.3706793802145411, + "learning_rate": 0.00012586595764188136, + "loss": 0.8315, + "mean_token_accuracy": 0.7498377323150635, + "num_tokens": 93452354.0, + "step": 40430 + }, + { + "epoch": 0.37077106445402036, + "learning_rate": 0.0001258476207939855, + "loss": 0.871, + "mean_token_accuracy": 0.7410698115825654, + "num_tokens": 93474616.0, + "step": 40440 + }, + { + "epoch": 0.3708627486934996, + "learning_rate": 0.0001258292839460897, + "loss": 0.8004, + "mean_token_accuracy": 0.7547740161418914, + "num_tokens": 93498594.0, + "step": 40450 + }, + { + "epoch": 0.3709544329329788, + "learning_rate": 0.00012581094709819383, + "loss": 0.8481, + "mean_token_accuracy": 0.7415642082691193, + "num_tokens": 93521499.0, + "step": 40460 + }, + { + "epoch": 0.37104611717245806, + "learning_rate": 0.00012579261025029797, + "loss": 0.8715, + "mean_token_accuracy": 0.7353518903255463, + "num_tokens": 93544054.0, + "step": 40470 + }, + { + "epoch": 0.3711378014119373, + "learning_rate": 0.00012577427340240214, + "loss": 0.8521, + "mean_token_accuracy": 0.7446906924247741, + "num_tokens": 93567225.0, + "step": 40480 + }, + { + "epoch": 0.3712294856514165, + "learning_rate": 0.00012575593655450628, + "loss": 0.8502, + "mean_token_accuracy": 0.7465663194656372, + "num_tokens": 93590500.0, + "step": 40490 + }, + { + "epoch": 0.37132116989089575, + "learning_rate": 0.00012573759970661044, + "loss": 0.8437, + "mean_token_accuracy": 0.7428981006145478, + "num_tokens": 93613735.0, + "step": 40500 + }, + { + "epoch": 0.371412854130375, + "learning_rate": 0.0001257192628587146, + "loss": 0.8992, + "mean_token_accuracy": 0.7355528891086578, + "num_tokens": 93637224.0, + "step": 40510 + }, + { + "epoch": 0.3715045383698542, + "learning_rate": 0.00012570092601081874, + "loss": 0.853, + "mean_token_accuracy": 0.742870831489563, + "num_tokens": 93660064.0, + "step": 40520 + }, + { + "epoch": 0.37159622260933345, + "learning_rate": 0.0001256825891629229, + "loss": 0.8017, + "mean_token_accuracy": 0.7555842518806457, + "num_tokens": 93683197.0, + "step": 40530 + }, + { + "epoch": 0.3716879068488127, + "learning_rate": 0.00012566425231502705, + "loss": 0.8352, + "mean_token_accuracy": 0.7442308604717255, + "num_tokens": 93706907.0, + "step": 40540 + }, + { + "epoch": 0.37177959108829195, + "learning_rate": 0.0001256459154671312, + "loss": 0.8294, + "mean_token_accuracy": 0.7532436072826385, + "num_tokens": 93730090.0, + "step": 40550 + }, + { + "epoch": 0.37187127532777114, + "learning_rate": 0.00012562757861923535, + "loss": 0.8732, + "mean_token_accuracy": 0.7416025876998902, + "num_tokens": 93753397.0, + "step": 40560 + }, + { + "epoch": 0.3719629595672504, + "learning_rate": 0.0001256092417713395, + "loss": 0.8535, + "mean_token_accuracy": 0.7419710040092469, + "num_tokens": 93776825.0, + "step": 40570 + }, + { + "epoch": 0.37205464380672965, + "learning_rate": 0.00012559090492344368, + "loss": 0.863, + "mean_token_accuracy": 0.7388189852237701, + "num_tokens": 93800186.0, + "step": 40580 + }, + { + "epoch": 0.37214632804620884, + "learning_rate": 0.00012557256807554782, + "loss": 0.8313, + "mean_token_accuracy": 0.7578201413154602, + "num_tokens": 93823162.0, + "step": 40590 + }, + { + "epoch": 0.3722380122856881, + "learning_rate": 0.00012555423122765199, + "loss": 0.8293, + "mean_token_accuracy": 0.7469756484031678, + "num_tokens": 93846024.0, + "step": 40600 + }, + { + "epoch": 0.37232969652516734, + "learning_rate": 0.00012553589437975612, + "loss": 0.8495, + "mean_token_accuracy": 0.7459544360637664, + "num_tokens": 93869454.0, + "step": 40610 + }, + { + "epoch": 0.37242138076464654, + "learning_rate": 0.00012551755753186026, + "loss": 0.8485, + "mean_token_accuracy": 0.7407496690750122, + "num_tokens": 93892403.0, + "step": 40620 + }, + { + "epoch": 0.3725130650041258, + "learning_rate": 0.00012549922068396443, + "loss": 0.8914, + "mean_token_accuracy": 0.7309635579586029, + "num_tokens": 93915122.0, + "step": 40630 + }, + { + "epoch": 0.37260474924360504, + "learning_rate": 0.0001254808838360686, + "loss": 0.8264, + "mean_token_accuracy": 0.7473390102386475, + "num_tokens": 93938613.0, + "step": 40640 + }, + { + "epoch": 0.37269643348308423, + "learning_rate": 0.00012546254698817276, + "loss": 0.8518, + "mean_token_accuracy": 0.748279732465744, + "num_tokens": 93961859.0, + "step": 40650 + }, + { + "epoch": 0.3727881177225635, + "learning_rate": 0.0001254442101402769, + "loss": 0.8539, + "mean_token_accuracy": 0.7445384502410889, + "num_tokens": 93984682.0, + "step": 40660 + }, + { + "epoch": 0.37287980196204273, + "learning_rate": 0.00012542587329238104, + "loss": 0.8455, + "mean_token_accuracy": 0.7497119009494781, + "num_tokens": 94007612.0, + "step": 40670 + }, + { + "epoch": 0.372971486201522, + "learning_rate": 0.0001254075364444852, + "loss": 0.8628, + "mean_token_accuracy": 0.7399684607982635, + "num_tokens": 94030804.0, + "step": 40680 + }, + { + "epoch": 0.3730631704410012, + "learning_rate": 0.00012538919959658934, + "loss": 0.8404, + "mean_token_accuracy": 0.7462611377239228, + "num_tokens": 94054300.0, + "step": 40690 + }, + { + "epoch": 0.37315485468048043, + "learning_rate": 0.0001253708627486935, + "loss": 0.8748, + "mean_token_accuracy": 0.7407118141651153, + "num_tokens": 94077828.0, + "step": 40700 + }, + { + "epoch": 0.3732465389199597, + "learning_rate": 0.00012535252590079767, + "loss": 0.8618, + "mean_token_accuracy": 0.7392879724502563, + "num_tokens": 94100971.0, + "step": 40710 + }, + { + "epoch": 0.3733382231594389, + "learning_rate": 0.0001253341890529018, + "loss": 0.8399, + "mean_token_accuracy": 0.7479075014591217, + "num_tokens": 94124078.0, + "step": 40720 + }, + { + "epoch": 0.3734299073989181, + "learning_rate": 0.00012531585220500597, + "loss": 0.8186, + "mean_token_accuracy": 0.7510039865970611, + "num_tokens": 94147238.0, + "step": 40730 + }, + { + "epoch": 0.3735215916383974, + "learning_rate": 0.0001252975153571101, + "loss": 0.8604, + "mean_token_accuracy": 0.741525012254715, + "num_tokens": 94170910.0, + "step": 40740 + }, + { + "epoch": 0.37361327587787657, + "learning_rate": 0.00012527917850921428, + "loss": 0.8155, + "mean_token_accuracy": 0.756772369146347, + "num_tokens": 94194339.0, + "step": 40750 + }, + { + "epoch": 0.3737049601173558, + "learning_rate": 0.00012526084166131842, + "loss": 0.8514, + "mean_token_accuracy": 0.74683518409729, + "num_tokens": 94217202.0, + "step": 40760 + }, + { + "epoch": 0.3737966443568351, + "learning_rate": 0.00012524250481342255, + "loss": 0.8497, + "mean_token_accuracy": 0.7476775407791137, + "num_tokens": 94239737.0, + "step": 40770 + }, + { + "epoch": 0.37388832859631427, + "learning_rate": 0.00012522416796552675, + "loss": 0.8581, + "mean_token_accuracy": 0.7390937447547913, + "num_tokens": 94262098.0, + "step": 40780 + }, + { + "epoch": 0.3739800128357935, + "learning_rate": 0.00012520583111763089, + "loss": 0.8444, + "mean_token_accuracy": 0.7504557430744171, + "num_tokens": 94285742.0, + "step": 40790 + }, + { + "epoch": 0.37407169707527277, + "learning_rate": 0.00012518749426973505, + "loss": 0.8141, + "mean_token_accuracy": 0.755222475528717, + "num_tokens": 94308696.0, + "step": 40800 + }, + { + "epoch": 0.374163381314752, + "learning_rate": 0.0001251691574218392, + "loss": 0.8436, + "mean_token_accuracy": 0.7472757160663605, + "num_tokens": 94331831.0, + "step": 40810 + }, + { + "epoch": 0.3742550655542312, + "learning_rate": 0.00012515082057394333, + "loss": 0.8492, + "mean_token_accuracy": 0.7493879616260528, + "num_tokens": 94355344.0, + "step": 40820 + }, + { + "epoch": 0.37434674979371046, + "learning_rate": 0.0001251324837260475, + "loss": 0.8484, + "mean_token_accuracy": 0.7448008000850678, + "num_tokens": 94377772.0, + "step": 40830 + }, + { + "epoch": 0.3744384340331897, + "learning_rate": 0.00012511414687815166, + "loss": 0.8664, + "mean_token_accuracy": 0.7426619470119477, + "num_tokens": 94400584.0, + "step": 40840 + }, + { + "epoch": 0.3745301182726689, + "learning_rate": 0.00012509581003025582, + "loss": 0.8652, + "mean_token_accuracy": 0.7521373689174652, + "num_tokens": 94423858.0, + "step": 40850 + }, + { + "epoch": 0.37462180251214816, + "learning_rate": 0.00012507747318235996, + "loss": 0.8404, + "mean_token_accuracy": 0.7479946434497833, + "num_tokens": 94447180.0, + "step": 40860 + }, + { + "epoch": 0.3747134867516274, + "learning_rate": 0.0001250591363344641, + "loss": 0.8649, + "mean_token_accuracy": 0.7471463203430175, + "num_tokens": 94469854.0, + "step": 40870 + }, + { + "epoch": 0.3748051709911066, + "learning_rate": 0.00012504079948656827, + "loss": 0.8443, + "mean_token_accuracy": 0.7519271194934845, + "num_tokens": 94492674.0, + "step": 40880 + }, + { + "epoch": 0.37489685523058586, + "learning_rate": 0.0001250224626386724, + "loss": 0.8688, + "mean_token_accuracy": 0.738123744726181, + "num_tokens": 94515867.0, + "step": 40890 + }, + { + "epoch": 0.3749885394700651, + "learning_rate": 0.00012500412579077657, + "loss": 0.8469, + "mean_token_accuracy": 0.7527352869510651, + "num_tokens": 94539391.0, + "step": 40900 + }, + { + "epoch": 0.3750802237095443, + "learning_rate": 0.00012498578894288073, + "loss": 0.8203, + "mean_token_accuracy": 0.7547052025794982, + "num_tokens": 94562710.0, + "step": 40910 + }, + { + "epoch": 0.37517190794902355, + "learning_rate": 0.00012496745209498487, + "loss": 0.8207, + "mean_token_accuracy": 0.7532356142997741, + "num_tokens": 94585833.0, + "step": 40920 + }, + { + "epoch": 0.3752635921885028, + "learning_rate": 0.00012494911524708904, + "loss": 0.8252, + "mean_token_accuracy": 0.7508581697940826, + "num_tokens": 94608891.0, + "step": 40930 + }, + { + "epoch": 0.37535527642798205, + "learning_rate": 0.00012493077839919318, + "loss": 0.8069, + "mean_token_accuracy": 0.7545634806156158, + "num_tokens": 94632468.0, + "step": 40940 + }, + { + "epoch": 0.37544696066746125, + "learning_rate": 0.00012491244155129734, + "loss": 0.8566, + "mean_token_accuracy": 0.7451045572757721, + "num_tokens": 94655745.0, + "step": 40950 + }, + { + "epoch": 0.3755386449069405, + "learning_rate": 0.00012489410470340148, + "loss": 0.8644, + "mean_token_accuracy": 0.7480914235115051, + "num_tokens": 94679039.0, + "step": 40960 + }, + { + "epoch": 0.37563032914641975, + "learning_rate": 0.00012487576785550565, + "loss": 0.835, + "mean_token_accuracy": 0.7503280758857727, + "num_tokens": 94701980.0, + "step": 40970 + }, + { + "epoch": 0.37572201338589895, + "learning_rate": 0.0001248574310076098, + "loss": 0.8683, + "mean_token_accuracy": 0.7421993672847748, + "num_tokens": 94724636.0, + "step": 40980 + }, + { + "epoch": 0.3758136976253782, + "learning_rate": 0.00012483909415971395, + "loss": 0.8698, + "mean_token_accuracy": 0.7421487331390381, + "num_tokens": 94747249.0, + "step": 40990 + }, + { + "epoch": 0.37590538186485745, + "learning_rate": 0.00012482075731181812, + "loss": 0.8223, + "mean_token_accuracy": 0.7498030722141266, + "num_tokens": 94770674.0, + "step": 41000 + }, + { + "epoch": 0.37599706610433664, + "learning_rate": 0.00012480242046392225, + "loss": 0.8823, + "mean_token_accuracy": 0.7403291165828705, + "num_tokens": 94792841.0, + "step": 41010 + }, + { + "epoch": 0.3760887503438159, + "learning_rate": 0.0001247840836160264, + "loss": 0.848, + "mean_token_accuracy": 0.7503290355205536, + "num_tokens": 94816525.0, + "step": 41020 + }, + { + "epoch": 0.37618043458329514, + "learning_rate": 0.00012476574676813056, + "loss": 0.8758, + "mean_token_accuracy": 0.7423287034034729, + "num_tokens": 94839607.0, + "step": 41030 + }, + { + "epoch": 0.37627211882277434, + "learning_rate": 0.00012474740992023472, + "loss": 0.8336, + "mean_token_accuracy": 0.7480650782585144, + "num_tokens": 94862380.0, + "step": 41040 + }, + { + "epoch": 0.3763638030622536, + "learning_rate": 0.0001247290730723389, + "loss": 0.8816, + "mean_token_accuracy": 0.7368262827396392, + "num_tokens": 94884977.0, + "step": 41050 + }, + { + "epoch": 0.37645548730173284, + "learning_rate": 0.00012471073622444303, + "loss": 0.8737, + "mean_token_accuracy": 0.7356580853462219, + "num_tokens": 94907461.0, + "step": 41060 + }, + { + "epoch": 0.3765471715412121, + "learning_rate": 0.00012469239937654716, + "loss": 0.8217, + "mean_token_accuracy": 0.7550493061542511, + "num_tokens": 94930311.0, + "step": 41070 + }, + { + "epoch": 0.3766388557806913, + "learning_rate": 0.00012467406252865133, + "loss": 0.7902, + "mean_token_accuracy": 0.7596096932888031, + "num_tokens": 94954141.0, + "step": 41080 + }, + { + "epoch": 0.37673054002017053, + "learning_rate": 0.00012465572568075547, + "loss": 0.7835, + "mean_token_accuracy": 0.7641208648681641, + "num_tokens": 94977436.0, + "step": 41090 + }, + { + "epoch": 0.3768222242596498, + "learning_rate": 0.00012463738883285963, + "loss": 0.9044, + "mean_token_accuracy": 0.7317468404769898, + "num_tokens": 95000214.0, + "step": 41100 + }, + { + "epoch": 0.376913908499129, + "learning_rate": 0.0001246190519849638, + "loss": 0.8658, + "mean_token_accuracy": 0.7414962947368622, + "num_tokens": 95023249.0, + "step": 41110 + }, + { + "epoch": 0.37700559273860823, + "learning_rate": 0.00012460071513706794, + "loss": 0.8281, + "mean_token_accuracy": 0.7514614582061767, + "num_tokens": 95047427.0, + "step": 41120 + }, + { + "epoch": 0.3770972769780875, + "learning_rate": 0.0001245823782891721, + "loss": 0.8769, + "mean_token_accuracy": 0.746800833940506, + "num_tokens": 95070850.0, + "step": 41130 + }, + { + "epoch": 0.3771889612175667, + "learning_rate": 0.00012456404144127624, + "loss": 0.8292, + "mean_token_accuracy": 0.7497871875762939, + "num_tokens": 95094166.0, + "step": 41140 + }, + { + "epoch": 0.3772806454570459, + "learning_rate": 0.0001245457045933804, + "loss": 0.8387, + "mean_token_accuracy": 0.7449946641921997, + "num_tokens": 95117487.0, + "step": 41150 + }, + { + "epoch": 0.3773723296965252, + "learning_rate": 0.00012452736774548455, + "loss": 0.7937, + "mean_token_accuracy": 0.7537588477134705, + "num_tokens": 95139646.0, + "step": 41160 + }, + { + "epoch": 0.3774640139360044, + "learning_rate": 0.0001245090308975887, + "loss": 0.8948, + "mean_token_accuracy": 0.7397721230983734, + "num_tokens": 95162508.0, + "step": 41170 + }, + { + "epoch": 0.3775556981754836, + "learning_rate": 0.00012449069404969288, + "loss": 0.8645, + "mean_token_accuracy": 0.7402627348899842, + "num_tokens": 95186041.0, + "step": 41180 + }, + { + "epoch": 0.3776473824149629, + "learning_rate": 0.00012447235720179701, + "loss": 0.8489, + "mean_token_accuracy": 0.7446037411689759, + "num_tokens": 95209303.0, + "step": 41190 + }, + { + "epoch": 0.3777390666544421, + "learning_rate": 0.00012445402035390118, + "loss": 0.8362, + "mean_token_accuracy": 0.7498924195766449, + "num_tokens": 95231958.0, + "step": 41200 + }, + { + "epoch": 0.3778307508939213, + "learning_rate": 0.00012443568350600532, + "loss": 0.8527, + "mean_token_accuracy": 0.7455955564975738, + "num_tokens": 95255840.0, + "step": 41210 + }, + { + "epoch": 0.37792243513340057, + "learning_rate": 0.00012441734665810946, + "loss": 0.8261, + "mean_token_accuracy": 0.7489126145839691, + "num_tokens": 95277953.0, + "step": 41220 + }, + { + "epoch": 0.3780141193728798, + "learning_rate": 0.00012439900981021365, + "loss": 0.8429, + "mean_token_accuracy": 0.7478990614414215, + "num_tokens": 95300794.0, + "step": 41230 + }, + { + "epoch": 0.378105803612359, + "learning_rate": 0.0001243806729623178, + "loss": 0.8459, + "mean_token_accuracy": 0.7479574739933014, + "num_tokens": 95324437.0, + "step": 41240 + }, + { + "epoch": 0.37819748785183827, + "learning_rate": 0.00012436233611442195, + "loss": 0.8491, + "mean_token_accuracy": 0.7490546584129334, + "num_tokens": 95347068.0, + "step": 41250 + }, + { + "epoch": 0.3782891720913175, + "learning_rate": 0.0001243439992665261, + "loss": 0.8327, + "mean_token_accuracy": 0.7576212704181671, + "num_tokens": 95370337.0, + "step": 41260 + }, + { + "epoch": 0.3783808563307967, + "learning_rate": 0.00012432566241863023, + "loss": 0.8434, + "mean_token_accuracy": 0.7524004936218261, + "num_tokens": 95392832.0, + "step": 41270 + }, + { + "epoch": 0.37847254057027596, + "learning_rate": 0.0001243073255707344, + "loss": 0.8465, + "mean_token_accuracy": 0.7434422254562378, + "num_tokens": 95415356.0, + "step": 41280 + }, + { + "epoch": 0.3785642248097552, + "learning_rate": 0.00012428898872283853, + "loss": 0.8459, + "mean_token_accuracy": 0.7438011527061462, + "num_tokens": 95438070.0, + "step": 41290 + }, + { + "epoch": 0.37865590904923446, + "learning_rate": 0.0001242706518749427, + "loss": 0.828, + "mean_token_accuracy": 0.750016987323761, + "num_tokens": 95460620.0, + "step": 41300 + }, + { + "epoch": 0.37874759328871366, + "learning_rate": 0.00012425231502704686, + "loss": 0.8719, + "mean_token_accuracy": 0.7443816423416137, + "num_tokens": 95483925.0, + "step": 41310 + }, + { + "epoch": 0.3788392775281929, + "learning_rate": 0.000124233978179151, + "loss": 0.8584, + "mean_token_accuracy": 0.7468372225761414, + "num_tokens": 95507638.0, + "step": 41320 + }, + { + "epoch": 0.37893096176767216, + "learning_rate": 0.00012421564133125517, + "loss": 0.8663, + "mean_token_accuracy": 0.7462254405021668, + "num_tokens": 95530682.0, + "step": 41330 + }, + { + "epoch": 0.37902264600715135, + "learning_rate": 0.0001241973044833593, + "loss": 0.8772, + "mean_token_accuracy": 0.7407940268516541, + "num_tokens": 95553642.0, + "step": 41340 + }, + { + "epoch": 0.3791143302466306, + "learning_rate": 0.00012417896763546347, + "loss": 0.8379, + "mean_token_accuracy": 0.7433828294277192, + "num_tokens": 95576261.0, + "step": 41350 + }, + { + "epoch": 0.37920601448610985, + "learning_rate": 0.00012416063078756764, + "loss": 0.8466, + "mean_token_accuracy": 0.7472116649150848, + "num_tokens": 95599140.0, + "step": 41360 + }, + { + "epoch": 0.37929769872558905, + "learning_rate": 0.00012414229393967177, + "loss": 0.8284, + "mean_token_accuracy": 0.747962474822998, + "num_tokens": 95622279.0, + "step": 41370 + }, + { + "epoch": 0.3793893829650683, + "learning_rate": 0.00012412395709177594, + "loss": 0.8466, + "mean_token_accuracy": 0.7496549546718597, + "num_tokens": 95645558.0, + "step": 41380 + }, + { + "epoch": 0.37948106720454755, + "learning_rate": 0.00012410562024388008, + "loss": 0.8786, + "mean_token_accuracy": 0.7420814752578735, + "num_tokens": 95669066.0, + "step": 41390 + }, + { + "epoch": 0.37957275144402675, + "learning_rate": 0.00012408728339598424, + "loss": 0.8305, + "mean_token_accuracy": 0.75220627784729, + "num_tokens": 95692111.0, + "step": 41400 + }, + { + "epoch": 0.379664435683506, + "learning_rate": 0.00012406894654808838, + "loss": 0.8597, + "mean_token_accuracy": 0.7449198603630066, + "num_tokens": 95715528.0, + "step": 41410 + }, + { + "epoch": 0.37975611992298525, + "learning_rate": 0.00012405060970019252, + "loss": 0.867, + "mean_token_accuracy": 0.7405585646629333, + "num_tokens": 95738027.0, + "step": 41420 + }, + { + "epoch": 0.3798478041624645, + "learning_rate": 0.0001240322728522967, + "loss": 0.8591, + "mean_token_accuracy": 0.7457330167293549, + "num_tokens": 95760789.0, + "step": 41430 + }, + { + "epoch": 0.3799394884019437, + "learning_rate": 0.00012401393600440085, + "loss": 0.8421, + "mean_token_accuracy": 0.7469176411628723, + "num_tokens": 95784396.0, + "step": 41440 + }, + { + "epoch": 0.38003117264142294, + "learning_rate": 0.00012399559915650502, + "loss": 0.8676, + "mean_token_accuracy": 0.7385257601737976, + "num_tokens": 95807642.0, + "step": 41450 + }, + { + "epoch": 0.3801228568809022, + "learning_rate": 0.00012397726230860916, + "loss": 0.8541, + "mean_token_accuracy": 0.7452293395996094, + "num_tokens": 95831408.0, + "step": 41460 + }, + { + "epoch": 0.3802145411203814, + "learning_rate": 0.0001239589254607133, + "loss": 0.8728, + "mean_token_accuracy": 0.7429750680923461, + "num_tokens": 95853824.0, + "step": 41470 + }, + { + "epoch": 0.38030622535986064, + "learning_rate": 0.00012394058861281746, + "loss": 0.8191, + "mean_token_accuracy": 0.7523462414741516, + "num_tokens": 95876263.0, + "step": 41480 + }, + { + "epoch": 0.3803979095993399, + "learning_rate": 0.00012392225176492162, + "loss": 0.8441, + "mean_token_accuracy": 0.7436273038387299, + "num_tokens": 95898382.0, + "step": 41490 + }, + { + "epoch": 0.3804895938388191, + "learning_rate": 0.00012390391491702576, + "loss": 0.8362, + "mean_token_accuracy": 0.7424362659454345, + "num_tokens": 95921189.0, + "step": 41500 + }, + { + "epoch": 0.38058127807829834, + "learning_rate": 0.00012388557806912993, + "loss": 0.8746, + "mean_token_accuracy": 0.7430182814598083, + "num_tokens": 95944401.0, + "step": 41510 + }, + { + "epoch": 0.3806729623177776, + "learning_rate": 0.00012386724122123407, + "loss": 0.8622, + "mean_token_accuracy": 0.7408500671386719, + "num_tokens": 95968077.0, + "step": 41520 + }, + { + "epoch": 0.3807646465572568, + "learning_rate": 0.00012384890437333823, + "loss": 0.8196, + "mean_token_accuracy": 0.7536414504051209, + "num_tokens": 95991717.0, + "step": 41530 + }, + { + "epoch": 0.38085633079673603, + "learning_rate": 0.00012383056752544237, + "loss": 0.8523, + "mean_token_accuracy": 0.745907062292099, + "num_tokens": 96014936.0, + "step": 41540 + }, + { + "epoch": 0.3809480150362153, + "learning_rate": 0.00012381223067754654, + "loss": 0.8658, + "mean_token_accuracy": 0.7377768397331238, + "num_tokens": 96038452.0, + "step": 41550 + }, + { + "epoch": 0.38103969927569453, + "learning_rate": 0.0001237938938296507, + "loss": 0.8583, + "mean_token_accuracy": 0.7457735657691955, + "num_tokens": 96061547.0, + "step": 41560 + }, + { + "epoch": 0.3811313835151737, + "learning_rate": 0.00012377555698175484, + "loss": 0.8483, + "mean_token_accuracy": 0.7477504968643188, + "num_tokens": 96084469.0, + "step": 41570 + }, + { + "epoch": 0.381223067754653, + "learning_rate": 0.000123757220133859, + "loss": 0.8195, + "mean_token_accuracy": 0.7502038061618805, + "num_tokens": 96106614.0, + "step": 41580 + }, + { + "epoch": 0.38131475199413223, + "learning_rate": 0.00012373888328596314, + "loss": 0.8362, + "mean_token_accuracy": 0.7560655534267425, + "num_tokens": 96129823.0, + "step": 41590 + }, + { + "epoch": 0.3814064362336114, + "learning_rate": 0.0001237205464380673, + "loss": 0.8237, + "mean_token_accuracy": 0.7563638985157013, + "num_tokens": 96152566.0, + "step": 41600 + }, + { + "epoch": 0.3814981204730907, + "learning_rate": 0.00012370220959017145, + "loss": 0.8346, + "mean_token_accuracy": 0.7453992128372192, + "num_tokens": 96175222.0, + "step": 41610 + }, + { + "epoch": 0.3815898047125699, + "learning_rate": 0.0001236838727422756, + "loss": 0.8499, + "mean_token_accuracy": 0.7355525553226471, + "num_tokens": 96197591.0, + "step": 41620 + }, + { + "epoch": 0.3816814889520491, + "learning_rate": 0.00012366553589437978, + "loss": 0.8649, + "mean_token_accuracy": 0.7429073810577392, + "num_tokens": 96221013.0, + "step": 41630 + }, + { + "epoch": 0.38177317319152837, + "learning_rate": 0.00012364719904648392, + "loss": 0.8443, + "mean_token_accuracy": 0.7413643419742584, + "num_tokens": 96243836.0, + "step": 41640 + }, + { + "epoch": 0.3818648574310076, + "learning_rate": 0.00012362886219858808, + "loss": 0.8604, + "mean_token_accuracy": 0.7440150916576386, + "num_tokens": 96267157.0, + "step": 41650 + }, + { + "epoch": 0.38195654167048687, + "learning_rate": 0.00012361052535069222, + "loss": 0.8339, + "mean_token_accuracy": 0.7463220000267029, + "num_tokens": 96289822.0, + "step": 41660 + }, + { + "epoch": 0.38204822590996607, + "learning_rate": 0.00012359218850279636, + "loss": 0.8804, + "mean_token_accuracy": 0.7378134787082672, + "num_tokens": 96313109.0, + "step": 41670 + }, + { + "epoch": 0.3821399101494453, + "learning_rate": 0.00012357385165490052, + "loss": 0.836, + "mean_token_accuracy": 0.7468629121780396, + "num_tokens": 96335956.0, + "step": 41680 + }, + { + "epoch": 0.38223159438892457, + "learning_rate": 0.0001235555148070047, + "loss": 0.8304, + "mean_token_accuracy": 0.7488134324550628, + "num_tokens": 96359066.0, + "step": 41690 + }, + { + "epoch": 0.38232327862840376, + "learning_rate": 0.00012353717795910883, + "loss": 0.8768, + "mean_token_accuracy": 0.7380219399929047, + "num_tokens": 96383087.0, + "step": 41700 + }, + { + "epoch": 0.382414962867883, + "learning_rate": 0.000123518841111213, + "loss": 0.8441, + "mean_token_accuracy": 0.7522395133972168, + "num_tokens": 96405689.0, + "step": 41710 + }, + { + "epoch": 0.38250664710736226, + "learning_rate": 0.00012350050426331713, + "loss": 0.8496, + "mean_token_accuracy": 0.7440075397491455, + "num_tokens": 96428809.0, + "step": 41720 + }, + { + "epoch": 0.38259833134684146, + "learning_rate": 0.0001234821674154213, + "loss": 0.8331, + "mean_token_accuracy": 0.7506649017333984, + "num_tokens": 96452688.0, + "step": 41730 + }, + { + "epoch": 0.3826900155863207, + "learning_rate": 0.00012346383056752543, + "loss": 0.8637, + "mean_token_accuracy": 0.7435618579387665, + "num_tokens": 96475313.0, + "step": 41740 + }, + { + "epoch": 0.38278169982579996, + "learning_rate": 0.0001234454937196296, + "loss": 0.8683, + "mean_token_accuracy": 0.7351320087909698, + "num_tokens": 96498150.0, + "step": 41750 + }, + { + "epoch": 0.38287338406527915, + "learning_rate": 0.00012342715687173377, + "loss": 0.8123, + "mean_token_accuracy": 0.7541450798511505, + "num_tokens": 96520766.0, + "step": 41760 + }, + { + "epoch": 0.3829650683047584, + "learning_rate": 0.0001234088200238379, + "loss": 0.8532, + "mean_token_accuracy": 0.7484757244586945, + "num_tokens": 96544237.0, + "step": 41770 + }, + { + "epoch": 0.38305675254423766, + "learning_rate": 0.00012339048317594207, + "loss": 0.8635, + "mean_token_accuracy": 0.740970355272293, + "num_tokens": 96566726.0, + "step": 41780 + }, + { + "epoch": 0.3831484367837169, + "learning_rate": 0.0001233721463280462, + "loss": 0.8339, + "mean_token_accuracy": 0.745781946182251, + "num_tokens": 96589099.0, + "step": 41790 + }, + { + "epoch": 0.3832401210231961, + "learning_rate": 0.00012335380948015037, + "loss": 0.8469, + "mean_token_accuracy": 0.7469968736171723, + "num_tokens": 96611204.0, + "step": 41800 + }, + { + "epoch": 0.38333180526267535, + "learning_rate": 0.0001233354726322545, + "loss": 0.8642, + "mean_token_accuracy": 0.7485895335674286, + "num_tokens": 96634671.0, + "step": 41810 + }, + { + "epoch": 0.3834234895021546, + "learning_rate": 0.00012331713578435868, + "loss": 0.8831, + "mean_token_accuracy": 0.7442315816879272, + "num_tokens": 96658050.0, + "step": 41820 + }, + { + "epoch": 0.3835151737416338, + "learning_rate": 0.00012329879893646284, + "loss": 0.8792, + "mean_token_accuracy": 0.7427907228469849, + "num_tokens": 96680366.0, + "step": 41830 + }, + { + "epoch": 0.38360685798111305, + "learning_rate": 0.00012328046208856698, + "loss": 0.8269, + "mean_token_accuracy": 0.7465570032596588, + "num_tokens": 96704047.0, + "step": 41840 + }, + { + "epoch": 0.3836985422205923, + "learning_rate": 0.00012326212524067115, + "loss": 0.8552, + "mean_token_accuracy": 0.7422377943992615, + "num_tokens": 96726945.0, + "step": 41850 + }, + { + "epoch": 0.3837902264600715, + "learning_rate": 0.00012324378839277528, + "loss": 0.8711, + "mean_token_accuracy": 0.7436909973621368, + "num_tokens": 96749645.0, + "step": 41860 + }, + { + "epoch": 0.38388191069955074, + "learning_rate": 0.00012322545154487942, + "loss": 0.8324, + "mean_token_accuracy": 0.7500499904155731, + "num_tokens": 96772768.0, + "step": 41870 + }, + { + "epoch": 0.38397359493903, + "learning_rate": 0.00012320711469698362, + "loss": 0.8649, + "mean_token_accuracy": 0.743410587310791, + "num_tokens": 96796061.0, + "step": 41880 + }, + { + "epoch": 0.3840652791785092, + "learning_rate": 0.00012318877784908775, + "loss": 0.8362, + "mean_token_accuracy": 0.7453331232070923, + "num_tokens": 96819674.0, + "step": 41890 + }, + { + "epoch": 0.38415696341798844, + "learning_rate": 0.0001231704410011919, + "loss": 0.8502, + "mean_token_accuracy": 0.7472075521945953, + "num_tokens": 96842618.0, + "step": 41900 + }, + { + "epoch": 0.3842486476574677, + "learning_rate": 0.00012315210415329606, + "loss": 0.8565, + "mean_token_accuracy": 0.7406310021877289, + "num_tokens": 96865875.0, + "step": 41910 + }, + { + "epoch": 0.38434033189694694, + "learning_rate": 0.0001231337673054002, + "loss": 0.8467, + "mean_token_accuracy": 0.7463303685188294, + "num_tokens": 96888689.0, + "step": 41920 + }, + { + "epoch": 0.38443201613642614, + "learning_rate": 0.00012311543045750436, + "loss": 0.8324, + "mean_token_accuracy": 0.7508059799671173, + "num_tokens": 96911639.0, + "step": 41930 + }, + { + "epoch": 0.3845237003759054, + "learning_rate": 0.0001230970936096085, + "loss": 0.8267, + "mean_token_accuracy": 0.7515237748622894, + "num_tokens": 96934886.0, + "step": 41940 + }, + { + "epoch": 0.38461538461538464, + "learning_rate": 0.00012307875676171266, + "loss": 0.8098, + "mean_token_accuracy": 0.7531907796859741, + "num_tokens": 96958264.0, + "step": 41950 + }, + { + "epoch": 0.38470706885486383, + "learning_rate": 0.00012306041991381683, + "loss": 0.833, + "mean_token_accuracy": 0.7565134763717651, + "num_tokens": 96981073.0, + "step": 41960 + }, + { + "epoch": 0.3847987530943431, + "learning_rate": 0.00012304208306592097, + "loss": 0.838, + "mean_token_accuracy": 0.7485580503940582, + "num_tokens": 97004097.0, + "step": 41970 + }, + { + "epoch": 0.38489043733382233, + "learning_rate": 0.00012302374621802513, + "loss": 0.8537, + "mean_token_accuracy": 0.7474245131015778, + "num_tokens": 97028029.0, + "step": 41980 + }, + { + "epoch": 0.38498212157330153, + "learning_rate": 0.00012300540937012927, + "loss": 0.8595, + "mean_token_accuracy": 0.7395976901054382, + "num_tokens": 97051585.0, + "step": 41990 + }, + { + "epoch": 0.3850738058127808, + "learning_rate": 0.00012298707252223344, + "loss": 0.8598, + "mean_token_accuracy": 0.7424962103366852, + "num_tokens": 97075015.0, + "step": 42000 + }, + { + "epoch": 0.38516549005226003, + "learning_rate": 0.00012296873567433758, + "loss": 0.8325, + "mean_token_accuracy": 0.7579595148563385, + "num_tokens": 97098684.0, + "step": 42010 + }, + { + "epoch": 0.3852571742917392, + "learning_rate": 0.00012295039882644174, + "loss": 0.8374, + "mean_token_accuracy": 0.7485345542430878, + "num_tokens": 97121634.0, + "step": 42020 + }, + { + "epoch": 0.3853488585312185, + "learning_rate": 0.0001229320619785459, + "loss": 0.904, + "mean_token_accuracy": 0.7320353865623475, + "num_tokens": 97143979.0, + "step": 42030 + }, + { + "epoch": 0.3854405427706977, + "learning_rate": 0.00012291372513065004, + "loss": 0.8389, + "mean_token_accuracy": 0.7421582698822021, + "num_tokens": 97167154.0, + "step": 42040 + }, + { + "epoch": 0.385532227010177, + "learning_rate": 0.0001228953882827542, + "loss": 0.8432, + "mean_token_accuracy": 0.7446771323680877, + "num_tokens": 97190056.0, + "step": 42050 + }, + { + "epoch": 0.38562391124965617, + "learning_rate": 0.00012287705143485835, + "loss": 0.854, + "mean_token_accuracy": 0.7453037738800049, + "num_tokens": 97212306.0, + "step": 42060 + }, + { + "epoch": 0.3857155954891354, + "learning_rate": 0.0001228587145869625, + "loss": 0.8621, + "mean_token_accuracy": 0.740193498134613, + "num_tokens": 97235252.0, + "step": 42070 + }, + { + "epoch": 0.38580727972861467, + "learning_rate": 0.00012284037773906668, + "loss": 0.8512, + "mean_token_accuracy": 0.7503459095954895, + "num_tokens": 97258122.0, + "step": 42080 + }, + { + "epoch": 0.38589896396809387, + "learning_rate": 0.00012282204089117082, + "loss": 0.8551, + "mean_token_accuracy": 0.7457744300365448, + "num_tokens": 97281193.0, + "step": 42090 + }, + { + "epoch": 0.3859906482075731, + "learning_rate": 0.00012280370404327496, + "loss": 0.8218, + "mean_token_accuracy": 0.7550775706768036, + "num_tokens": 97304317.0, + "step": 42100 + }, + { + "epoch": 0.38608233244705237, + "learning_rate": 0.00012278536719537912, + "loss": 0.8719, + "mean_token_accuracy": 0.7475060760974884, + "num_tokens": 97326943.0, + "step": 42110 + }, + { + "epoch": 0.38617401668653156, + "learning_rate": 0.00012276703034748326, + "loss": 0.8289, + "mean_token_accuracy": 0.7514943778514862, + "num_tokens": 97350240.0, + "step": 42120 + }, + { + "epoch": 0.3862657009260108, + "learning_rate": 0.00012274869349958743, + "loss": 0.8554, + "mean_token_accuracy": 0.7483797132968902, + "num_tokens": 97373501.0, + "step": 42130 + }, + { + "epoch": 0.38635738516549006, + "learning_rate": 0.00012273035665169156, + "loss": 0.8326, + "mean_token_accuracy": 0.7438017189502716, + "num_tokens": 97396653.0, + "step": 42140 + }, + { + "epoch": 0.38644906940496926, + "learning_rate": 0.00012271201980379573, + "loss": 0.8892, + "mean_token_accuracy": 0.7413406610488892, + "num_tokens": 97420576.0, + "step": 42150 + }, + { + "epoch": 0.3865407536444485, + "learning_rate": 0.0001226936829558999, + "loss": 0.7911, + "mean_token_accuracy": 0.7549246847629547, + "num_tokens": 97443503.0, + "step": 42160 + }, + { + "epoch": 0.38663243788392776, + "learning_rate": 0.00012267534610800403, + "loss": 0.8077, + "mean_token_accuracy": 0.7582757711410523, + "num_tokens": 97466317.0, + "step": 42170 + }, + { + "epoch": 0.386724122123407, + "learning_rate": 0.0001226570092601082, + "loss": 0.8666, + "mean_token_accuracy": 0.7399112820625305, + "num_tokens": 97489520.0, + "step": 42180 + }, + { + "epoch": 0.3868158063628862, + "learning_rate": 0.00012263867241221234, + "loss": 0.8243, + "mean_token_accuracy": 0.747317761182785, + "num_tokens": 97512132.0, + "step": 42190 + }, + { + "epoch": 0.38690749060236546, + "learning_rate": 0.0001226203355643165, + "loss": 0.8308, + "mean_token_accuracy": 0.7511660397052765, + "num_tokens": 97535004.0, + "step": 42200 + }, + { + "epoch": 0.3869991748418447, + "learning_rate": 0.00012260199871642067, + "loss": 0.8471, + "mean_token_accuracy": 0.7478880822658539, + "num_tokens": 97557136.0, + "step": 42210 + }, + { + "epoch": 0.3870908590813239, + "learning_rate": 0.0001225836618685248, + "loss": 0.8666, + "mean_token_accuracy": 0.7463126242160797, + "num_tokens": 97579596.0, + "step": 42220 + }, + { + "epoch": 0.38718254332080315, + "learning_rate": 0.00012256532502062897, + "loss": 0.8444, + "mean_token_accuracy": 0.7474619388580322, + "num_tokens": 97602562.0, + "step": 42230 + }, + { + "epoch": 0.3872742275602824, + "learning_rate": 0.0001225469881727331, + "loss": 0.8184, + "mean_token_accuracy": 0.7536703109741211, + "num_tokens": 97625331.0, + "step": 42240 + }, + { + "epoch": 0.3873659117997616, + "learning_rate": 0.00012252865132483727, + "loss": 0.8307, + "mean_token_accuracy": 0.7487288653850556, + "num_tokens": 97648543.0, + "step": 42250 + }, + { + "epoch": 0.38745759603924085, + "learning_rate": 0.0001225103144769414, + "loss": 0.9086, + "mean_token_accuracy": 0.7395607650279998, + "num_tokens": 97671348.0, + "step": 42260 + }, + { + "epoch": 0.3875492802787201, + "learning_rate": 0.00012249197762904555, + "loss": 0.827, + "mean_token_accuracy": 0.7564811944961548, + "num_tokens": 97694750.0, + "step": 42270 + }, + { + "epoch": 0.38764096451819935, + "learning_rate": 0.00012247364078114974, + "loss": 0.867, + "mean_token_accuracy": 0.7427230477333069, + "num_tokens": 97717795.0, + "step": 42280 + }, + { + "epoch": 0.38773264875767854, + "learning_rate": 0.00012245530393325388, + "loss": 0.848, + "mean_token_accuracy": 0.7396143674850464, + "num_tokens": 97741096.0, + "step": 42290 + }, + { + "epoch": 0.3878243329971578, + "learning_rate": 0.00012243696708535802, + "loss": 0.846, + "mean_token_accuracy": 0.7423577010631561, + "num_tokens": 97764715.0, + "step": 42300 + }, + { + "epoch": 0.38791601723663705, + "learning_rate": 0.00012241863023746219, + "loss": 0.8201, + "mean_token_accuracy": 0.7547329008579254, + "num_tokens": 97787789.0, + "step": 42310 + }, + { + "epoch": 0.38800770147611624, + "learning_rate": 0.00012240029338956632, + "loss": 0.8317, + "mean_token_accuracy": 0.7471260011196137, + "num_tokens": 97811110.0, + "step": 42320 + }, + { + "epoch": 0.3880993857155955, + "learning_rate": 0.0001223819565416705, + "loss": 0.8537, + "mean_token_accuracy": 0.7432671666145325, + "num_tokens": 97833659.0, + "step": 42330 + }, + { + "epoch": 0.38819106995507474, + "learning_rate": 0.00012236361969377466, + "loss": 0.8508, + "mean_token_accuracy": 0.7468033790588379, + "num_tokens": 97856353.0, + "step": 42340 + }, + { + "epoch": 0.38828275419455394, + "learning_rate": 0.0001223452828458788, + "loss": 0.8484, + "mean_token_accuracy": 0.7481363534927368, + "num_tokens": 97878954.0, + "step": 42350 + }, + { + "epoch": 0.3883744384340332, + "learning_rate": 0.00012232694599798296, + "loss": 0.8698, + "mean_token_accuracy": 0.747006356716156, + "num_tokens": 97901800.0, + "step": 42360 + }, + { + "epoch": 0.38846612267351244, + "learning_rate": 0.0001223086091500871, + "loss": 0.8725, + "mean_token_accuracy": 0.739853686094284, + "num_tokens": 97925070.0, + "step": 42370 + }, + { + "epoch": 0.38855780691299163, + "learning_rate": 0.00012229027230219126, + "loss": 0.8405, + "mean_token_accuracy": 0.7503976643085479, + "num_tokens": 97948335.0, + "step": 42380 + }, + { + "epoch": 0.3886494911524709, + "learning_rate": 0.0001222719354542954, + "loss": 0.8567, + "mean_token_accuracy": 0.7516186773777008, + "num_tokens": 97971069.0, + "step": 42390 + }, + { + "epoch": 0.38874117539195013, + "learning_rate": 0.00012225359860639957, + "loss": 0.8584, + "mean_token_accuracy": 0.7411632359027862, + "num_tokens": 97993235.0, + "step": 42400 + }, + { + "epoch": 0.3888328596314294, + "learning_rate": 0.00012223526175850373, + "loss": 0.847, + "mean_token_accuracy": 0.7408832550048828, + "num_tokens": 98016281.0, + "step": 42410 + }, + { + "epoch": 0.3889245438709086, + "learning_rate": 0.00012221692491060787, + "loss": 0.9311, + "mean_token_accuracy": 0.7320229709148407, + "num_tokens": 98039308.0, + "step": 42420 + }, + { + "epoch": 0.38901622811038783, + "learning_rate": 0.00012219858806271204, + "loss": 0.8542, + "mean_token_accuracy": 0.744017893075943, + "num_tokens": 98062055.0, + "step": 42430 + }, + { + "epoch": 0.3891079123498671, + "learning_rate": 0.00012218025121481617, + "loss": 0.848, + "mean_token_accuracy": 0.7475646376609802, + "num_tokens": 98085320.0, + "step": 42440 + }, + { + "epoch": 0.3891995965893463, + "learning_rate": 0.00012216191436692034, + "loss": 0.8589, + "mean_token_accuracy": 0.7441819250583649, + "num_tokens": 98108024.0, + "step": 42450 + }, + { + "epoch": 0.3892912808288255, + "learning_rate": 0.00012214357751902448, + "loss": 0.8901, + "mean_token_accuracy": 0.7354893386363983, + "num_tokens": 98130336.0, + "step": 42460 + }, + { + "epoch": 0.3893829650683048, + "learning_rate": 0.00012212524067112864, + "loss": 0.8666, + "mean_token_accuracy": 0.7383145391941071, + "num_tokens": 98153502.0, + "step": 42470 + }, + { + "epoch": 0.38947464930778397, + "learning_rate": 0.0001221069038232328, + "loss": 0.8717, + "mean_token_accuracy": 0.7394768238067627, + "num_tokens": 98177078.0, + "step": 42480 + }, + { + "epoch": 0.3895663335472632, + "learning_rate": 0.00012208856697533695, + "loss": 0.8478, + "mean_token_accuracy": 0.744846111536026, + "num_tokens": 98200383.0, + "step": 42490 + }, + { + "epoch": 0.38965801778674247, + "learning_rate": 0.0001220702301274411, + "loss": 0.8555, + "mean_token_accuracy": 0.7416116893291473, + "num_tokens": 98223102.0, + "step": 42500 + }, + { + "epoch": 0.38974970202622167, + "learning_rate": 0.00012205189327954525, + "loss": 0.8751, + "mean_token_accuracy": 0.7336749017238617, + "num_tokens": 98246797.0, + "step": 42510 + }, + { + "epoch": 0.3898413862657009, + "learning_rate": 0.0001220335564316494, + "loss": 0.8081, + "mean_token_accuracy": 0.7532801032066345, + "num_tokens": 98269820.0, + "step": 42520 + }, + { + "epoch": 0.38993307050518017, + "learning_rate": 0.00012201521958375355, + "loss": 0.8313, + "mean_token_accuracy": 0.7471497416496277, + "num_tokens": 98293072.0, + "step": 42530 + }, + { + "epoch": 0.3900247547446594, + "learning_rate": 0.00012199688273585772, + "loss": 0.8637, + "mean_token_accuracy": 0.7445648729801178, + "num_tokens": 98315948.0, + "step": 42540 + }, + { + "epoch": 0.3901164389841386, + "learning_rate": 0.00012197854588796187, + "loss": 0.8442, + "mean_token_accuracy": 0.7450841248035431, + "num_tokens": 98338378.0, + "step": 42550 + }, + { + "epoch": 0.39020812322361786, + "learning_rate": 0.00012196020904006602, + "loss": 0.8267, + "mean_token_accuracy": 0.7513948380947113, + "num_tokens": 98362016.0, + "step": 42560 + }, + { + "epoch": 0.3902998074630971, + "learning_rate": 0.00012194187219217018, + "loss": 0.8697, + "mean_token_accuracy": 0.7414669454097748, + "num_tokens": 98385630.0, + "step": 42570 + }, + { + "epoch": 0.3903914917025763, + "learning_rate": 0.00012192353534427431, + "loss": 0.8283, + "mean_token_accuracy": 0.7504765570163727, + "num_tokens": 98408996.0, + "step": 42580 + }, + { + "epoch": 0.39048317594205556, + "learning_rate": 0.00012190519849637847, + "loss": 0.8619, + "mean_token_accuracy": 0.7417500793933869, + "num_tokens": 98432049.0, + "step": 42590 + }, + { + "epoch": 0.3905748601815348, + "learning_rate": 0.00012188686164848264, + "loss": 0.8381, + "mean_token_accuracy": 0.7420496046543121, + "num_tokens": 98455519.0, + "step": 42600 + }, + { + "epoch": 0.390666544421014, + "learning_rate": 0.0001218685248005868, + "loss": 0.8385, + "mean_token_accuracy": 0.7466835856437684, + "num_tokens": 98478520.0, + "step": 42610 + }, + { + "epoch": 0.39075822866049326, + "learning_rate": 0.00012185018795269095, + "loss": 0.7995, + "mean_token_accuracy": 0.7615115284919739, + "num_tokens": 98501855.0, + "step": 42620 + }, + { + "epoch": 0.3908499128999725, + "learning_rate": 0.00012183185110479509, + "loss": 0.8389, + "mean_token_accuracy": 0.7464279592037201, + "num_tokens": 98524679.0, + "step": 42630 + }, + { + "epoch": 0.3909415971394517, + "learning_rate": 0.00012181351425689924, + "loss": 0.8199, + "mean_token_accuracy": 0.7543918073177338, + "num_tokens": 98547887.0, + "step": 42640 + }, + { + "epoch": 0.39103328137893095, + "learning_rate": 0.00012179517740900339, + "loss": 0.8726, + "mean_token_accuracy": 0.7465454757213592, + "num_tokens": 98570755.0, + "step": 42650 + }, + { + "epoch": 0.3911249656184102, + "learning_rate": 0.00012177684056110754, + "loss": 0.8359, + "mean_token_accuracy": 0.7499042809009552, + "num_tokens": 98593619.0, + "step": 42660 + }, + { + "epoch": 0.39121664985788945, + "learning_rate": 0.00012175850371321171, + "loss": 0.8672, + "mean_token_accuracy": 0.739033991098404, + "num_tokens": 98617118.0, + "step": 42670 + }, + { + "epoch": 0.39130833409736865, + "learning_rate": 0.00012174016686531586, + "loss": 0.8327, + "mean_token_accuracy": 0.7493605077266693, + "num_tokens": 98640269.0, + "step": 42680 + }, + { + "epoch": 0.3914000183368479, + "learning_rate": 0.00012172183001742001, + "loss": 0.8561, + "mean_token_accuracy": 0.7385443985462189, + "num_tokens": 98663620.0, + "step": 42690 + }, + { + "epoch": 0.39149170257632715, + "learning_rate": 0.00012170349316952416, + "loss": 0.878, + "mean_token_accuracy": 0.7378088414669037, + "num_tokens": 98685736.0, + "step": 42700 + }, + { + "epoch": 0.39158338681580634, + "learning_rate": 0.00012168515632162831, + "loss": 0.8515, + "mean_token_accuracy": 0.7487938463687897, + "num_tokens": 98709117.0, + "step": 42710 + }, + { + "epoch": 0.3916750710552856, + "learning_rate": 0.00012166681947373247, + "loss": 0.8203, + "mean_token_accuracy": 0.749659925699234, + "num_tokens": 98731923.0, + "step": 42720 + }, + { + "epoch": 0.39176675529476485, + "learning_rate": 0.00012164848262583663, + "loss": 0.8418, + "mean_token_accuracy": 0.7471487343311309, + "num_tokens": 98755131.0, + "step": 42730 + }, + { + "epoch": 0.39185843953424404, + "learning_rate": 0.00012163014577794078, + "loss": 0.8276, + "mean_token_accuracy": 0.7469102501869201, + "num_tokens": 98777466.0, + "step": 42740 + }, + { + "epoch": 0.3919501237737233, + "learning_rate": 0.00012161180893004494, + "loss": 0.8469, + "mean_token_accuracy": 0.7467431008815766, + "num_tokens": 98800678.0, + "step": 42750 + }, + { + "epoch": 0.39204180801320254, + "learning_rate": 0.00012159347208214909, + "loss": 0.8514, + "mean_token_accuracy": 0.7480627417564392, + "num_tokens": 98823655.0, + "step": 42760 + }, + { + "epoch": 0.39213349225268174, + "learning_rate": 0.00012157513523425324, + "loss": 0.873, + "mean_token_accuracy": 0.7421223044395446, + "num_tokens": 98846518.0, + "step": 42770 + }, + { + "epoch": 0.392225176492161, + "learning_rate": 0.00012155679838635738, + "loss": 0.8477, + "mean_token_accuracy": 0.7416431248188019, + "num_tokens": 98869526.0, + "step": 42780 + }, + { + "epoch": 0.39231686073164024, + "learning_rate": 0.00012153846153846153, + "loss": 0.8112, + "mean_token_accuracy": 0.7553065061569214, + "num_tokens": 98892933.0, + "step": 42790 + }, + { + "epoch": 0.3924085449711195, + "learning_rate": 0.00012152012469056571, + "loss": 0.843, + "mean_token_accuracy": 0.7412650406360626, + "num_tokens": 98917050.0, + "step": 42800 + }, + { + "epoch": 0.3925002292105987, + "learning_rate": 0.00012150178784266986, + "loss": 0.8334, + "mean_token_accuracy": 0.7481203973293304, + "num_tokens": 98940712.0, + "step": 42810 + }, + { + "epoch": 0.39259191345007793, + "learning_rate": 0.00012148345099477401, + "loss": 0.8293, + "mean_token_accuracy": 0.7494286298751831, + "num_tokens": 98963947.0, + "step": 42820 + }, + { + "epoch": 0.3926835976895572, + "learning_rate": 0.00012146511414687815, + "loss": 0.8074, + "mean_token_accuracy": 0.750173556804657, + "num_tokens": 98987200.0, + "step": 42830 + }, + { + "epoch": 0.3927752819290364, + "learning_rate": 0.0001214467772989823, + "loss": 0.868, + "mean_token_accuracy": 0.7378338158130646, + "num_tokens": 99009578.0, + "step": 42840 + }, + { + "epoch": 0.39286696616851563, + "learning_rate": 0.00012142844045108645, + "loss": 0.8632, + "mean_token_accuracy": 0.7450571894645691, + "num_tokens": 99032320.0, + "step": 42850 + }, + { + "epoch": 0.3929586504079949, + "learning_rate": 0.00012141010360319063, + "loss": 0.8443, + "mean_token_accuracy": 0.7450294673442841, + "num_tokens": 99055223.0, + "step": 42860 + }, + { + "epoch": 0.3930503346474741, + "learning_rate": 0.00012139176675529477, + "loss": 0.8393, + "mean_token_accuracy": 0.7470239520072937, + "num_tokens": 99078331.0, + "step": 42870 + }, + { + "epoch": 0.3931420188869533, + "learning_rate": 0.00012137342990739892, + "loss": 0.8092, + "mean_token_accuracy": 0.7598694741725922, + "num_tokens": 99101696.0, + "step": 42880 + }, + { + "epoch": 0.3932337031264326, + "learning_rate": 0.00012135509305950308, + "loss": 0.827, + "mean_token_accuracy": 0.7489305198192596, + "num_tokens": 99124755.0, + "step": 42890 + }, + { + "epoch": 0.3933253873659118, + "learning_rate": 0.00012133675621160723, + "loss": 0.8434, + "mean_token_accuracy": 0.7529129922389984, + "num_tokens": 99147473.0, + "step": 42900 + }, + { + "epoch": 0.393417071605391, + "learning_rate": 0.00012131841936371138, + "loss": 0.8458, + "mean_token_accuracy": 0.7490242481231689, + "num_tokens": 99171225.0, + "step": 42910 + }, + { + "epoch": 0.3935087558448703, + "learning_rate": 0.00012130008251581553, + "loss": 0.8284, + "mean_token_accuracy": 0.7435774505138397, + "num_tokens": 99195536.0, + "step": 42920 + }, + { + "epoch": 0.3936004400843495, + "learning_rate": 0.0001212817456679197, + "loss": 0.8307, + "mean_token_accuracy": 0.7494882762432098, + "num_tokens": 99218147.0, + "step": 42930 + }, + { + "epoch": 0.3936921243238287, + "learning_rate": 0.00012126340882002385, + "loss": 0.8304, + "mean_token_accuracy": 0.7515585660934448, + "num_tokens": 99240637.0, + "step": 42940 + }, + { + "epoch": 0.39378380856330797, + "learning_rate": 0.000121245071972128, + "loss": 0.845, + "mean_token_accuracy": 0.7488064289093017, + "num_tokens": 99263733.0, + "step": 42950 + }, + { + "epoch": 0.3938754928027872, + "learning_rate": 0.00012122673512423215, + "loss": 0.9101, + "mean_token_accuracy": 0.7396009862422943, + "num_tokens": 99286473.0, + "step": 42960 + }, + { + "epoch": 0.3939671770422664, + "learning_rate": 0.0001212083982763363, + "loss": 0.8595, + "mean_token_accuracy": 0.743252569437027, + "num_tokens": 99309354.0, + "step": 42970 + }, + { + "epoch": 0.39405886128174566, + "learning_rate": 0.00012119006142844044, + "loss": 0.816, + "mean_token_accuracy": 0.7507643580436707, + "num_tokens": 99331905.0, + "step": 42980 + }, + { + "epoch": 0.3941505455212249, + "learning_rate": 0.00012117172458054462, + "loss": 0.8492, + "mean_token_accuracy": 0.746544623374939, + "num_tokens": 99354264.0, + "step": 42990 + }, + { + "epoch": 0.3942422297607041, + "learning_rate": 0.00012115338773264877, + "loss": 0.8609, + "mean_token_accuracy": 0.7427237629890442, + "num_tokens": 99377357.0, + "step": 43000 + }, + { + "epoch": 0.39433391400018336, + "learning_rate": 0.00012113505088475293, + "loss": 0.8577, + "mean_token_accuracy": 0.7417212784290313, + "num_tokens": 99400242.0, + "step": 43010 + }, + { + "epoch": 0.3944255982396626, + "learning_rate": 0.00012111671403685708, + "loss": 0.842, + "mean_token_accuracy": 0.7445471584796906, + "num_tokens": 99423294.0, + "step": 43020 + }, + { + "epoch": 0.39451728247914186, + "learning_rate": 0.00012109837718896122, + "loss": 0.8659, + "mean_token_accuracy": 0.7416339635848999, + "num_tokens": 99445823.0, + "step": 43030 + }, + { + "epoch": 0.39460896671862106, + "learning_rate": 0.00012108004034106537, + "loss": 0.8688, + "mean_token_accuracy": 0.7422155618667603, + "num_tokens": 99468454.0, + "step": 43040 + }, + { + "epoch": 0.3947006509581003, + "learning_rate": 0.00012106170349316952, + "loss": 0.8361, + "mean_token_accuracy": 0.7583410799503326, + "num_tokens": 99491409.0, + "step": 43050 + }, + { + "epoch": 0.39479233519757956, + "learning_rate": 0.0001210433666452737, + "loss": 0.8369, + "mean_token_accuracy": 0.7550324678421021, + "num_tokens": 99514341.0, + "step": 43060 + }, + { + "epoch": 0.39488401943705875, + "learning_rate": 0.00012102502979737784, + "loss": 0.8803, + "mean_token_accuracy": 0.7441314160823822, + "num_tokens": 99537581.0, + "step": 43070 + }, + { + "epoch": 0.394975703676538, + "learning_rate": 0.00012100669294948199, + "loss": 0.8515, + "mean_token_accuracy": 0.7438615500926972, + "num_tokens": 99560268.0, + "step": 43080 + }, + { + "epoch": 0.39506738791601725, + "learning_rate": 0.00012098835610158614, + "loss": 0.8457, + "mean_token_accuracy": 0.7410091102123261, + "num_tokens": 99583320.0, + "step": 43090 + }, + { + "epoch": 0.39515907215549645, + "learning_rate": 0.00012097001925369029, + "loss": 0.8483, + "mean_token_accuracy": 0.7494796335697174, + "num_tokens": 99606247.0, + "step": 43100 + }, + { + "epoch": 0.3952507563949757, + "learning_rate": 0.00012095168240579444, + "loss": 0.8149, + "mean_token_accuracy": 0.7595623373985291, + "num_tokens": 99629914.0, + "step": 43110 + }, + { + "epoch": 0.39534244063445495, + "learning_rate": 0.00012093334555789861, + "loss": 0.8512, + "mean_token_accuracy": 0.7407776236534118, + "num_tokens": 99652816.0, + "step": 43120 + }, + { + "epoch": 0.39543412487393415, + "learning_rate": 0.00012091500871000276, + "loss": 0.8373, + "mean_token_accuracy": 0.7508548200130463, + "num_tokens": 99676031.0, + "step": 43130 + }, + { + "epoch": 0.3955258091134134, + "learning_rate": 0.00012089667186210691, + "loss": 0.8636, + "mean_token_accuracy": 0.7446913063526154, + "num_tokens": 99699036.0, + "step": 43140 + }, + { + "epoch": 0.39561749335289265, + "learning_rate": 0.00012087833501421106, + "loss": 0.8713, + "mean_token_accuracy": 0.7402331829071045, + "num_tokens": 99722190.0, + "step": 43150 + }, + { + "epoch": 0.3957091775923719, + "learning_rate": 0.00012085999816631522, + "loss": 0.8153, + "mean_token_accuracy": 0.750926959514618, + "num_tokens": 99745313.0, + "step": 43160 + }, + { + "epoch": 0.3958008618318511, + "learning_rate": 0.00012084166131841937, + "loss": 0.8101, + "mean_token_accuracy": 0.7540000259876252, + "num_tokens": 99768305.0, + "step": 43170 + }, + { + "epoch": 0.39589254607133034, + "learning_rate": 0.00012082332447052351, + "loss": 0.8608, + "mean_token_accuracy": 0.7495555579662323, + "num_tokens": 99792280.0, + "step": 43180 + }, + { + "epoch": 0.3959842303108096, + "learning_rate": 0.00012080498762262769, + "loss": 0.8031, + "mean_token_accuracy": 0.7534538269042969, + "num_tokens": 99815372.0, + "step": 43190 + }, + { + "epoch": 0.3960759145502888, + "learning_rate": 0.00012078665077473184, + "loss": 0.88, + "mean_token_accuracy": 0.7427812039852142, + "num_tokens": 99838466.0, + "step": 43200 + }, + { + "epoch": 0.39616759878976804, + "learning_rate": 0.00012076831392683599, + "loss": 0.8639, + "mean_token_accuracy": 0.741842633485794, + "num_tokens": 99862328.0, + "step": 43210 + }, + { + "epoch": 0.3962592830292473, + "learning_rate": 0.00012074997707894014, + "loss": 0.8568, + "mean_token_accuracy": 0.7447823584079742, + "num_tokens": 99884941.0, + "step": 43220 + }, + { + "epoch": 0.3963509672687265, + "learning_rate": 0.00012073164023104428, + "loss": 0.8504, + "mean_token_accuracy": 0.7410430669784546, + "num_tokens": 99907642.0, + "step": 43230 + }, + { + "epoch": 0.39644265150820573, + "learning_rate": 0.00012071330338314843, + "loss": 0.8472, + "mean_token_accuracy": 0.7453603327274323, + "num_tokens": 99930851.0, + "step": 43240 + }, + { + "epoch": 0.396534335747685, + "learning_rate": 0.00012069496653525258, + "loss": 0.8579, + "mean_token_accuracy": 0.7414930880069732, + "num_tokens": 99953855.0, + "step": 43250 + }, + { + "epoch": 0.3966260199871642, + "learning_rate": 0.00012067662968735676, + "loss": 0.8482, + "mean_token_accuracy": 0.7489110469818115, + "num_tokens": 99976786.0, + "step": 43260 + }, + { + "epoch": 0.39671770422664343, + "learning_rate": 0.0001206582928394609, + "loss": 0.8079, + "mean_token_accuracy": 0.7556454241275787, + "num_tokens": 99999249.0, + "step": 43270 + }, + { + "epoch": 0.3968093884661227, + "learning_rate": 0.00012063995599156505, + "loss": 0.8448, + "mean_token_accuracy": 0.7377425312995911, + "num_tokens": 100021933.0, + "step": 43280 + }, + { + "epoch": 0.39690107270560193, + "learning_rate": 0.0001206216191436692, + "loss": 0.8017, + "mean_token_accuracy": 0.760702782869339, + "num_tokens": 100045196.0, + "step": 43290 + }, + { + "epoch": 0.3969927569450811, + "learning_rate": 0.00012060328229577336, + "loss": 0.819, + "mean_token_accuracy": 0.744375479221344, + "num_tokens": 100068677.0, + "step": 43300 + }, + { + "epoch": 0.3970844411845604, + "learning_rate": 0.00012058494544787751, + "loss": 0.8532, + "mean_token_accuracy": 0.7433301329612731, + "num_tokens": 100092304.0, + "step": 43310 + }, + { + "epoch": 0.3971761254240396, + "learning_rate": 0.00012056660859998167, + "loss": 0.8163, + "mean_token_accuracy": 0.7581689298152924, + "num_tokens": 100115907.0, + "step": 43320 + }, + { + "epoch": 0.3972678096635188, + "learning_rate": 0.00012054827175208583, + "loss": 0.8598, + "mean_token_accuracy": 0.7469379425048828, + "num_tokens": 100139640.0, + "step": 43330 + }, + { + "epoch": 0.3973594939029981, + "learning_rate": 0.00012052993490418998, + "loss": 0.8272, + "mean_token_accuracy": 0.7534853637218475, + "num_tokens": 100162485.0, + "step": 43340 + }, + { + "epoch": 0.3974511781424773, + "learning_rate": 0.00012051159805629413, + "loss": 0.8403, + "mean_token_accuracy": 0.7501318275928497, + "num_tokens": 100185141.0, + "step": 43350 + }, + { + "epoch": 0.3975428623819565, + "learning_rate": 0.00012049326120839828, + "loss": 0.8592, + "mean_token_accuracy": 0.7472609996795654, + "num_tokens": 100207347.0, + "step": 43360 + }, + { + "epoch": 0.39763454662143577, + "learning_rate": 0.00012047492436050243, + "loss": 0.887, + "mean_token_accuracy": 0.7339904844760895, + "num_tokens": 100230845.0, + "step": 43370 + }, + { + "epoch": 0.397726230860915, + "learning_rate": 0.00012045658751260657, + "loss": 0.8466, + "mean_token_accuracy": 0.7437448918819427, + "num_tokens": 100253777.0, + "step": 43380 + }, + { + "epoch": 0.3978179151003942, + "learning_rate": 0.00012043825066471075, + "loss": 0.8404, + "mean_token_accuracy": 0.7450472593307496, + "num_tokens": 100277783.0, + "step": 43390 + }, + { + "epoch": 0.39790959933987347, + "learning_rate": 0.0001204199138168149, + "loss": 0.8272, + "mean_token_accuracy": 0.7582185566425323, + "num_tokens": 100300341.0, + "step": 43400 + }, + { + "epoch": 0.3980012835793527, + "learning_rate": 0.00012040157696891905, + "loss": 0.8411, + "mean_token_accuracy": 0.7432398974895478, + "num_tokens": 100323475.0, + "step": 43410 + }, + { + "epoch": 0.39809296781883197, + "learning_rate": 0.0001203832401210232, + "loss": 0.8475, + "mean_token_accuracy": 0.7457428812980652, + "num_tokens": 100346552.0, + "step": 43420 + }, + { + "epoch": 0.39818465205831116, + "learning_rate": 0.00012036490327312734, + "loss": 0.8252, + "mean_token_accuracy": 0.7546516418457031, + "num_tokens": 100370155.0, + "step": 43430 + }, + { + "epoch": 0.3982763362977904, + "learning_rate": 0.0001203465664252315, + "loss": 0.861, + "mean_token_accuracy": 0.7470997512340546, + "num_tokens": 100393240.0, + "step": 43440 + }, + { + "epoch": 0.39836802053726966, + "learning_rate": 0.00012032822957733568, + "loss": 0.8607, + "mean_token_accuracy": 0.7425906300544739, + "num_tokens": 100416700.0, + "step": 43450 + }, + { + "epoch": 0.39845970477674886, + "learning_rate": 0.00012030989272943983, + "loss": 0.8386, + "mean_token_accuracy": 0.7485748767852783, + "num_tokens": 100441329.0, + "step": 43460 + }, + { + "epoch": 0.3985513890162281, + "learning_rate": 0.00012029155588154397, + "loss": 0.8715, + "mean_token_accuracy": 0.7444190859794617, + "num_tokens": 100464254.0, + "step": 43470 + }, + { + "epoch": 0.39864307325570736, + "learning_rate": 0.00012027321903364812, + "loss": 0.8355, + "mean_token_accuracy": 0.7469911396503448, + "num_tokens": 100486921.0, + "step": 43480 + }, + { + "epoch": 0.39873475749518655, + "learning_rate": 0.00012025488218575227, + "loss": 0.8213, + "mean_token_accuracy": 0.748364919424057, + "num_tokens": 100509643.0, + "step": 43490 + }, + { + "epoch": 0.3988264417346658, + "learning_rate": 0.00012023654533785642, + "loss": 0.8507, + "mean_token_accuracy": 0.7430125772953033, + "num_tokens": 100533152.0, + "step": 43500 + }, + { + "epoch": 0.39891812597414505, + "learning_rate": 0.00012021820848996057, + "loss": 0.8543, + "mean_token_accuracy": 0.7426909685134888, + "num_tokens": 100556596.0, + "step": 43510 + }, + { + "epoch": 0.3990098102136243, + "learning_rate": 0.00012019987164206474, + "loss": 0.8448, + "mean_token_accuracy": 0.7450658738613128, + "num_tokens": 100580296.0, + "step": 43520 + }, + { + "epoch": 0.3991014944531035, + "learning_rate": 0.00012018153479416889, + "loss": 0.8528, + "mean_token_accuracy": 0.7435936272144318, + "num_tokens": 100602819.0, + "step": 43530 + }, + { + "epoch": 0.39919317869258275, + "learning_rate": 0.00012016319794627304, + "loss": 0.8497, + "mean_token_accuracy": 0.7447150588035584, + "num_tokens": 100625938.0, + "step": 43540 + }, + { + "epoch": 0.399284862932062, + "learning_rate": 0.0001201448610983772, + "loss": 0.8558, + "mean_token_accuracy": 0.7477009654045105, + "num_tokens": 100649270.0, + "step": 43550 + }, + { + "epoch": 0.3993765471715412, + "learning_rate": 0.00012012652425048135, + "loss": 0.803, + "mean_token_accuracy": 0.7549422085285187, + "num_tokens": 100671672.0, + "step": 43560 + }, + { + "epoch": 0.39946823141102045, + "learning_rate": 0.0001201081874025855, + "loss": 0.8285, + "mean_token_accuracy": 0.7511558353900909, + "num_tokens": 100694873.0, + "step": 43570 + }, + { + "epoch": 0.3995599156504997, + "learning_rate": 0.00012008985055468966, + "loss": 0.821, + "mean_token_accuracy": 0.7527211785316468, + "num_tokens": 100718075.0, + "step": 43580 + }, + { + "epoch": 0.3996515998899789, + "learning_rate": 0.00012007151370679381, + "loss": 0.8583, + "mean_token_accuracy": 0.7468614757061005, + "num_tokens": 100741696.0, + "step": 43590 + }, + { + "epoch": 0.39974328412945814, + "learning_rate": 0.00012005317685889797, + "loss": 0.8612, + "mean_token_accuracy": 0.7396007180213928, + "num_tokens": 100765060.0, + "step": 43600 + }, + { + "epoch": 0.3998349683689374, + "learning_rate": 0.00012003484001100212, + "loss": 0.8714, + "mean_token_accuracy": 0.7453867971897126, + "num_tokens": 100787963.0, + "step": 43610 + }, + { + "epoch": 0.3999266526084166, + "learning_rate": 0.00012001650316310627, + "loss": 0.8341, + "mean_token_accuracy": 0.747481620311737, + "num_tokens": 100811178.0, + "step": 43620 + }, + { + "epoch": 0.40001833684789584, + "learning_rate": 0.00011999816631521041, + "loss": 0.7975, + "mean_token_accuracy": 0.7568912744522095, + "num_tokens": 100834528.0, + "step": 43630 + }, + { + "epoch": 0.4001100210873751, + "learning_rate": 0.00011997982946731456, + "loss": 0.8208, + "mean_token_accuracy": 0.7569917798042297, + "num_tokens": 100857446.0, + "step": 43640 + }, + { + "epoch": 0.40020170532685434, + "learning_rate": 0.00011996149261941874, + "loss": 0.8304, + "mean_token_accuracy": 0.7474347651004791, + "num_tokens": 100880370.0, + "step": 43650 + }, + { + "epoch": 0.40029338956633354, + "learning_rate": 0.00011994315577152289, + "loss": 0.8183, + "mean_token_accuracy": 0.7509926438331604, + "num_tokens": 100903945.0, + "step": 43660 + }, + { + "epoch": 0.4003850738058128, + "learning_rate": 0.00011992481892362703, + "loss": 0.8228, + "mean_token_accuracy": 0.7485302925109864, + "num_tokens": 100928168.0, + "step": 43670 + }, + { + "epoch": 0.40047675804529204, + "learning_rate": 0.00011990648207573118, + "loss": 0.8492, + "mean_token_accuracy": 0.7437901318073272, + "num_tokens": 100951180.0, + "step": 43680 + }, + { + "epoch": 0.40056844228477123, + "learning_rate": 0.00011988814522783533, + "loss": 0.8741, + "mean_token_accuracy": 0.7450493574142456, + "num_tokens": 100975076.0, + "step": 43690 + }, + { + "epoch": 0.4006601265242505, + "learning_rate": 0.00011986980837993949, + "loss": 0.8482, + "mean_token_accuracy": 0.7441963791847229, + "num_tokens": 100997457.0, + "step": 43700 + }, + { + "epoch": 0.40075181076372973, + "learning_rate": 0.00011985147153204366, + "loss": 0.8509, + "mean_token_accuracy": 0.7498200833797455, + "num_tokens": 101019465.0, + "step": 43710 + }, + { + "epoch": 0.4008434950032089, + "learning_rate": 0.0001198331346841478, + "loss": 0.8061, + "mean_token_accuracy": 0.7549359560012817, + "num_tokens": 101041935.0, + "step": 43720 + }, + { + "epoch": 0.4009351792426882, + "learning_rate": 0.00011981479783625195, + "loss": 0.8544, + "mean_token_accuracy": 0.7457621693611145, + "num_tokens": 101064399.0, + "step": 43730 + }, + { + "epoch": 0.40102686348216743, + "learning_rate": 0.0001197964609883561, + "loss": 0.8586, + "mean_token_accuracy": 0.7421365141868591, + "num_tokens": 101087211.0, + "step": 43740 + }, + { + "epoch": 0.4011185477216466, + "learning_rate": 0.00011977812414046026, + "loss": 0.837, + "mean_token_accuracy": 0.7481885135173798, + "num_tokens": 101110590.0, + "step": 43750 + }, + { + "epoch": 0.4012102319611259, + "learning_rate": 0.00011975978729256441, + "loss": 0.8816, + "mean_token_accuracy": 0.7407104909420014, + "num_tokens": 101132886.0, + "step": 43760 + }, + { + "epoch": 0.4013019162006051, + "learning_rate": 0.00011974145044466856, + "loss": 0.8582, + "mean_token_accuracy": 0.7441464364528656, + "num_tokens": 101156067.0, + "step": 43770 + }, + { + "epoch": 0.4013936004400844, + "learning_rate": 0.00011972311359677273, + "loss": 0.8721, + "mean_token_accuracy": 0.7364722907543182, + "num_tokens": 101178662.0, + "step": 43780 + }, + { + "epoch": 0.40148528467956357, + "learning_rate": 0.00011970477674887688, + "loss": 0.8405, + "mean_token_accuracy": 0.7392441511154175, + "num_tokens": 101201467.0, + "step": 43790 + }, + { + "epoch": 0.4015769689190428, + "learning_rate": 0.00011968643990098103, + "loss": 0.8537, + "mean_token_accuracy": 0.7440224051475525, + "num_tokens": 101223977.0, + "step": 43800 + }, + { + "epoch": 0.40166865315852207, + "learning_rate": 0.00011966810305308518, + "loss": 0.8452, + "mean_token_accuracy": 0.7479540884494782, + "num_tokens": 101247890.0, + "step": 43810 + }, + { + "epoch": 0.40176033739800127, + "learning_rate": 0.00011964976620518933, + "loss": 0.8483, + "mean_token_accuracy": 0.7450882971286774, + "num_tokens": 101271332.0, + "step": 43820 + }, + { + "epoch": 0.4018520216374805, + "learning_rate": 0.00011963142935729347, + "loss": 0.8558, + "mean_token_accuracy": 0.7435620367527008, + "num_tokens": 101294299.0, + "step": 43830 + }, + { + "epoch": 0.40194370587695977, + "learning_rate": 0.00011961309250939765, + "loss": 0.8206, + "mean_token_accuracy": 0.7506714522838592, + "num_tokens": 101316883.0, + "step": 43840 + }, + { + "epoch": 0.40203539011643896, + "learning_rate": 0.0001195947556615018, + "loss": 0.8718, + "mean_token_accuracy": 0.7427827298641205, + "num_tokens": 101339963.0, + "step": 43850 + }, + { + "epoch": 0.4021270743559182, + "learning_rate": 0.00011957641881360596, + "loss": 0.8667, + "mean_token_accuracy": 0.7400134563446045, + "num_tokens": 101362611.0, + "step": 43860 + }, + { + "epoch": 0.40221875859539746, + "learning_rate": 0.0001195580819657101, + "loss": 0.806, + "mean_token_accuracy": 0.7647567331790924, + "num_tokens": 101385865.0, + "step": 43870 + }, + { + "epoch": 0.40231044283487666, + "learning_rate": 0.00011953974511781425, + "loss": 0.8297, + "mean_token_accuracy": 0.7499696552753449, + "num_tokens": 101409036.0, + "step": 43880 + }, + { + "epoch": 0.4024021270743559, + "learning_rate": 0.0001195214082699184, + "loss": 0.8476, + "mean_token_accuracy": 0.7489574372768402, + "num_tokens": 101432714.0, + "step": 43890 + }, + { + "epoch": 0.40249381131383516, + "learning_rate": 0.00011950307142202255, + "loss": 0.838, + "mean_token_accuracy": 0.7476186215877533, + "num_tokens": 101455873.0, + "step": 43900 + }, + { + "epoch": 0.4025854955533144, + "learning_rate": 0.00011948473457412673, + "loss": 0.8823, + "mean_token_accuracy": 0.7406718492507934, + "num_tokens": 101479168.0, + "step": 43910 + }, + { + "epoch": 0.4026771797927936, + "learning_rate": 0.00011946639772623087, + "loss": 0.802, + "mean_token_accuracy": 0.7554150402545929, + "num_tokens": 101502172.0, + "step": 43920 + }, + { + "epoch": 0.40276886403227286, + "learning_rate": 0.00011944806087833502, + "loss": 0.8512, + "mean_token_accuracy": 0.7441450178623199, + "num_tokens": 101524795.0, + "step": 43930 + }, + { + "epoch": 0.4028605482717521, + "learning_rate": 0.00011942972403043917, + "loss": 0.8607, + "mean_token_accuracy": 0.7382725477218628, + "num_tokens": 101547878.0, + "step": 43940 + }, + { + "epoch": 0.4029522325112313, + "learning_rate": 0.00011941138718254332, + "loss": 0.8598, + "mean_token_accuracy": 0.7430664479732514, + "num_tokens": 101571696.0, + "step": 43950 + }, + { + "epoch": 0.40304391675071055, + "learning_rate": 0.00011939305033464747, + "loss": 0.8598, + "mean_token_accuracy": 0.7453457295894623, + "num_tokens": 101595070.0, + "step": 43960 + }, + { + "epoch": 0.4031356009901898, + "learning_rate": 0.00011937471348675164, + "loss": 0.8905, + "mean_token_accuracy": 0.7316078066825866, + "num_tokens": 101618211.0, + "step": 43970 + }, + { + "epoch": 0.403227285229669, + "learning_rate": 0.00011935637663885579, + "loss": 0.8701, + "mean_token_accuracy": 0.7397210478782654, + "num_tokens": 101641912.0, + "step": 43980 + }, + { + "epoch": 0.40331896946914825, + "learning_rate": 0.00011933803979095994, + "loss": 0.8556, + "mean_token_accuracy": 0.7466451168060303, + "num_tokens": 101665133.0, + "step": 43990 + }, + { + "epoch": 0.4034106537086275, + "learning_rate": 0.0001193197029430641, + "loss": 0.8315, + "mean_token_accuracy": 0.7544361591339112, + "num_tokens": 101687839.0, + "step": 44000 + }, + { + "epoch": 0.4035023379481067, + "learning_rate": 0.00011930136609516825, + "loss": 0.83, + "mean_token_accuracy": 0.7543080925941468, + "num_tokens": 101711127.0, + "step": 44010 + }, + { + "epoch": 0.40359402218758594, + "learning_rate": 0.0001192830292472724, + "loss": 0.8526, + "mean_token_accuracy": 0.7467760264873504, + "num_tokens": 101734011.0, + "step": 44020 + }, + { + "epoch": 0.4036857064270652, + "learning_rate": 0.00011926469239937654, + "loss": 0.8638, + "mean_token_accuracy": 0.7457446813583374, + "num_tokens": 101756746.0, + "step": 44030 + }, + { + "epoch": 0.40377739066654444, + "learning_rate": 0.00011924635555148072, + "loss": 0.8521, + "mean_token_accuracy": 0.747233772277832, + "num_tokens": 101779213.0, + "step": 44040 + }, + { + "epoch": 0.40386907490602364, + "learning_rate": 0.00011922801870358487, + "loss": 0.8582, + "mean_token_accuracy": 0.745703935623169, + "num_tokens": 101802158.0, + "step": 44050 + }, + { + "epoch": 0.4039607591455029, + "learning_rate": 0.00011920968185568902, + "loss": 0.8628, + "mean_token_accuracy": 0.7423049509525299, + "num_tokens": 101826496.0, + "step": 44060 + }, + { + "epoch": 0.40405244338498214, + "learning_rate": 0.00011919134500779316, + "loss": 0.8436, + "mean_token_accuracy": 0.7474491834640503, + "num_tokens": 101850270.0, + "step": 44070 + }, + { + "epoch": 0.40414412762446134, + "learning_rate": 0.00011917300815989731, + "loss": 0.8596, + "mean_token_accuracy": 0.7463626205921173, + "num_tokens": 101873556.0, + "step": 44080 + }, + { + "epoch": 0.4042358118639406, + "learning_rate": 0.00011915467131200146, + "loss": 0.8452, + "mean_token_accuracy": 0.7486437380313873, + "num_tokens": 101895943.0, + "step": 44090 + }, + { + "epoch": 0.40432749610341984, + "learning_rate": 0.00011913633446410564, + "loss": 0.8374, + "mean_token_accuracy": 0.7513238906860351, + "num_tokens": 101918519.0, + "step": 44100 + }, + { + "epoch": 0.40441918034289903, + "learning_rate": 0.0001191179976162098, + "loss": 0.8215, + "mean_token_accuracy": 0.7529733896255493, + "num_tokens": 101941660.0, + "step": 44110 + }, + { + "epoch": 0.4045108645823783, + "learning_rate": 0.00011909966076831393, + "loss": 0.824, + "mean_token_accuracy": 0.7548643171787262, + "num_tokens": 101965299.0, + "step": 44120 + }, + { + "epoch": 0.40460254882185753, + "learning_rate": 0.00011908132392041808, + "loss": 0.8469, + "mean_token_accuracy": 0.7420718908309937, + "num_tokens": 101987681.0, + "step": 44130 + }, + { + "epoch": 0.4046942330613368, + "learning_rate": 0.00011906298707252224, + "loss": 0.8319, + "mean_token_accuracy": 0.746285080909729, + "num_tokens": 102011072.0, + "step": 44140 + }, + { + "epoch": 0.404785917300816, + "learning_rate": 0.00011904465022462639, + "loss": 0.8826, + "mean_token_accuracy": 0.734488719701767, + "num_tokens": 102034292.0, + "step": 44150 + }, + { + "epoch": 0.40487760154029523, + "learning_rate": 0.00011902631337673054, + "loss": 0.8133, + "mean_token_accuracy": 0.7553673982620239, + "num_tokens": 102057192.0, + "step": 44160 + }, + { + "epoch": 0.4049692857797745, + "learning_rate": 0.0001190079765288347, + "loss": 0.8558, + "mean_token_accuracy": 0.747709047794342, + "num_tokens": 102081059.0, + "step": 44170 + }, + { + "epoch": 0.4050609700192537, + "learning_rate": 0.00011898963968093886, + "loss": 0.8484, + "mean_token_accuracy": 0.7444964587688446, + "num_tokens": 102103572.0, + "step": 44180 + }, + { + "epoch": 0.4051526542587329, + "learning_rate": 0.00011897130283304301, + "loss": 0.8652, + "mean_token_accuracy": 0.7443179070949555, + "num_tokens": 102126442.0, + "step": 44190 + }, + { + "epoch": 0.4052443384982122, + "learning_rate": 0.00011895296598514716, + "loss": 0.8333, + "mean_token_accuracy": 0.7456013679504394, + "num_tokens": 102150062.0, + "step": 44200 + }, + { + "epoch": 0.40533602273769137, + "learning_rate": 0.00011893462913725131, + "loss": 0.8189, + "mean_token_accuracy": 0.7510856688022614, + "num_tokens": 102172765.0, + "step": 44210 + }, + { + "epoch": 0.4054277069771706, + "learning_rate": 0.00011891629228935546, + "loss": 0.8832, + "mean_token_accuracy": 0.7396148025989533, + "num_tokens": 102195726.0, + "step": 44220 + }, + { + "epoch": 0.40551939121664987, + "learning_rate": 0.00011889795544145963, + "loss": 0.8657, + "mean_token_accuracy": 0.7436016976833344, + "num_tokens": 102218803.0, + "step": 44230 + }, + { + "epoch": 0.40561107545612907, + "learning_rate": 0.00011887961859356378, + "loss": 0.8285, + "mean_token_accuracy": 0.7495310842990875, + "num_tokens": 102241640.0, + "step": 44240 + }, + { + "epoch": 0.4057027596956083, + "learning_rate": 0.00011886128174566793, + "loss": 0.84, + "mean_token_accuracy": 0.744154554605484, + "num_tokens": 102264526.0, + "step": 44250 + }, + { + "epoch": 0.40579444393508757, + "learning_rate": 0.00011884294489777208, + "loss": 0.86, + "mean_token_accuracy": 0.7446904242038727, + "num_tokens": 102287369.0, + "step": 44260 + }, + { + "epoch": 0.4058861281745668, + "learning_rate": 0.00011882460804987622, + "loss": 0.8619, + "mean_token_accuracy": 0.7469142735004425, + "num_tokens": 102309206.0, + "step": 44270 + }, + { + "epoch": 0.405977812414046, + "learning_rate": 0.00011880627120198037, + "loss": 0.8252, + "mean_token_accuracy": 0.7514234960079194, + "num_tokens": 102332607.0, + "step": 44280 + }, + { + "epoch": 0.40606949665352526, + "learning_rate": 0.00011878793435408453, + "loss": 0.8261, + "mean_token_accuracy": 0.7492182672023773, + "num_tokens": 102355420.0, + "step": 44290 + }, + { + "epoch": 0.4061611808930045, + "learning_rate": 0.0001187695975061887, + "loss": 0.8296, + "mean_token_accuracy": 0.7488252580165863, + "num_tokens": 102378099.0, + "step": 44300 + }, + { + "epoch": 0.4062528651324837, + "learning_rate": 0.00011875126065829286, + "loss": 0.8359, + "mean_token_accuracy": 0.7438942015171051, + "num_tokens": 102400457.0, + "step": 44310 + }, + { + "epoch": 0.40634454937196296, + "learning_rate": 0.000118732923810397, + "loss": 0.8376, + "mean_token_accuracy": 0.7458237946033478, + "num_tokens": 102423634.0, + "step": 44320 + }, + { + "epoch": 0.4064362336114422, + "learning_rate": 0.00011871458696250115, + "loss": 0.8316, + "mean_token_accuracy": 0.7501737952232361, + "num_tokens": 102446648.0, + "step": 44330 + }, + { + "epoch": 0.4065279178509214, + "learning_rate": 0.0001186962501146053, + "loss": 0.8217, + "mean_token_accuracy": 0.7535607576370239, + "num_tokens": 102469286.0, + "step": 44340 + }, + { + "epoch": 0.40661960209040066, + "learning_rate": 0.00011867791326670945, + "loss": 0.8618, + "mean_token_accuracy": 0.745497316122055, + "num_tokens": 102492018.0, + "step": 44350 + }, + { + "epoch": 0.4067112863298799, + "learning_rate": 0.0001186595764188136, + "loss": 0.8541, + "mean_token_accuracy": 0.7416003167629241, + "num_tokens": 102515303.0, + "step": 44360 + }, + { + "epoch": 0.4068029705693591, + "learning_rate": 0.00011864123957091777, + "loss": 0.8378, + "mean_token_accuracy": 0.7473686873912812, + "num_tokens": 102538681.0, + "step": 44370 + }, + { + "epoch": 0.40689465480883835, + "learning_rate": 0.00011862290272302192, + "loss": 0.8094, + "mean_token_accuracy": 0.7564398288726807, + "num_tokens": 102561937.0, + "step": 44380 + }, + { + "epoch": 0.4069863390483176, + "learning_rate": 0.00011860456587512607, + "loss": 0.8623, + "mean_token_accuracy": 0.7400487780570983, + "num_tokens": 102586449.0, + "step": 44390 + }, + { + "epoch": 0.40707802328779685, + "learning_rate": 0.00011858622902723022, + "loss": 0.8508, + "mean_token_accuracy": 0.7529193341732026, + "num_tokens": 102609825.0, + "step": 44400 + }, + { + "epoch": 0.40716970752727605, + "learning_rate": 0.00011856789217933438, + "loss": 0.8672, + "mean_token_accuracy": 0.7442286550998688, + "num_tokens": 102632464.0, + "step": 44410 + }, + { + "epoch": 0.4072613917667553, + "learning_rate": 0.00011854955533143853, + "loss": 0.8463, + "mean_token_accuracy": 0.7453698098659516, + "num_tokens": 102655420.0, + "step": 44420 + }, + { + "epoch": 0.40735307600623455, + "learning_rate": 0.0001185312184835427, + "loss": 0.8175, + "mean_token_accuracy": 0.7565670073032379, + "num_tokens": 102677858.0, + "step": 44430 + }, + { + "epoch": 0.40744476024571374, + "learning_rate": 0.00011851288163564685, + "loss": 0.8393, + "mean_token_accuracy": 0.7486736238002777, + "num_tokens": 102701173.0, + "step": 44440 + }, + { + "epoch": 0.407536444485193, + "learning_rate": 0.000118494544787751, + "loss": 0.8521, + "mean_token_accuracy": 0.7465475678443909, + "num_tokens": 102723990.0, + "step": 44450 + }, + { + "epoch": 0.40762812872467225, + "learning_rate": 0.00011847620793985515, + "loss": 0.8484, + "mean_token_accuracy": 0.7493509948253632, + "num_tokens": 102746923.0, + "step": 44460 + }, + { + "epoch": 0.40771981296415144, + "learning_rate": 0.00011845787109195929, + "loss": 0.8246, + "mean_token_accuracy": 0.7481965899467469, + "num_tokens": 102769325.0, + "step": 44470 + }, + { + "epoch": 0.4078114972036307, + "learning_rate": 0.00011843953424406344, + "loss": 0.8743, + "mean_token_accuracy": 0.739555686712265, + "num_tokens": 102791877.0, + "step": 44480 + }, + { + "epoch": 0.40790318144310994, + "learning_rate": 0.00011842119739616759, + "loss": 0.8601, + "mean_token_accuracy": 0.7448561131954193, + "num_tokens": 102815231.0, + "step": 44490 + }, + { + "epoch": 0.40799486568258914, + "learning_rate": 0.00011840286054827177, + "loss": 0.8747, + "mean_token_accuracy": 0.7401957511901855, + "num_tokens": 102838475.0, + "step": 44500 + }, + { + "epoch": 0.4080865499220684, + "learning_rate": 0.00011838452370037592, + "loss": 0.8054, + "mean_token_accuracy": 0.7538772940635681, + "num_tokens": 102862031.0, + "step": 44510 + }, + { + "epoch": 0.40817823416154764, + "learning_rate": 0.00011836618685248006, + "loss": 0.8771, + "mean_token_accuracy": 0.7395708858966827, + "num_tokens": 102884888.0, + "step": 44520 + }, + { + "epoch": 0.4082699184010269, + "learning_rate": 0.00011834785000458421, + "loss": 0.8437, + "mean_token_accuracy": 0.7475594997406005, + "num_tokens": 102907801.0, + "step": 44530 + }, + { + "epoch": 0.4083616026405061, + "learning_rate": 0.00011832951315668836, + "loss": 0.8337, + "mean_token_accuracy": 0.750956678390503, + "num_tokens": 102930883.0, + "step": 44540 + }, + { + "epoch": 0.40845328687998533, + "learning_rate": 0.00011831117630879252, + "loss": 0.8071, + "mean_token_accuracy": 0.756844425201416, + "num_tokens": 102954198.0, + "step": 44550 + }, + { + "epoch": 0.4085449711194646, + "learning_rate": 0.00011829283946089668, + "loss": 0.831, + "mean_token_accuracy": 0.7487766325473786, + "num_tokens": 102977390.0, + "step": 44560 + }, + { + "epoch": 0.4086366553589438, + "learning_rate": 0.00011827450261300083, + "loss": 0.8609, + "mean_token_accuracy": 0.7401157557964325, + "num_tokens": 102999947.0, + "step": 44570 + }, + { + "epoch": 0.40872833959842303, + "learning_rate": 0.00011825616576510499, + "loss": 0.8476, + "mean_token_accuracy": 0.748603880405426, + "num_tokens": 103023087.0, + "step": 44580 + }, + { + "epoch": 0.4088200238379023, + "learning_rate": 0.00011823782891720914, + "loss": 0.8179, + "mean_token_accuracy": 0.7481927216053009, + "num_tokens": 103046768.0, + "step": 44590 + }, + { + "epoch": 0.4089117080773815, + "learning_rate": 0.00011821949206931329, + "loss": 0.8276, + "mean_token_accuracy": 0.7536837041378022, + "num_tokens": 103069457.0, + "step": 44600 + }, + { + "epoch": 0.4090033923168607, + "learning_rate": 0.00011820115522141744, + "loss": 0.8702, + "mean_token_accuracy": 0.7421279847621918, + "num_tokens": 103092706.0, + "step": 44610 + }, + { + "epoch": 0.40909507655634, + "learning_rate": 0.00011818281837352159, + "loss": 0.8373, + "mean_token_accuracy": 0.7506707310676575, + "num_tokens": 103116056.0, + "step": 44620 + }, + { + "epoch": 0.40918676079581917, + "learning_rate": 0.00011816448152562576, + "loss": 0.8236, + "mean_token_accuracy": 0.7536875903606415, + "num_tokens": 103138614.0, + "step": 44630 + }, + { + "epoch": 0.4092784450352984, + "learning_rate": 0.00011814614467772991, + "loss": 0.8237, + "mean_token_accuracy": 0.7470583975315094, + "num_tokens": 103161558.0, + "step": 44640 + }, + { + "epoch": 0.40937012927477767, + "learning_rate": 0.00011812780782983406, + "loss": 0.8478, + "mean_token_accuracy": 0.74755819439888, + "num_tokens": 103183648.0, + "step": 44650 + }, + { + "epoch": 0.4094618135142569, + "learning_rate": 0.00011810947098193821, + "loss": 0.8389, + "mean_token_accuracy": 0.7449398815631867, + "num_tokens": 103207033.0, + "step": 44660 + }, + { + "epoch": 0.4095534977537361, + "learning_rate": 0.00011809113413404235, + "loss": 0.8576, + "mean_token_accuracy": 0.7453439235687256, + "num_tokens": 103230407.0, + "step": 44670 + }, + { + "epoch": 0.40964518199321537, + "learning_rate": 0.0001180727972861465, + "loss": 0.8258, + "mean_token_accuracy": 0.7497498154640198, + "num_tokens": 103254064.0, + "step": 44680 + }, + { + "epoch": 0.4097368662326946, + "learning_rate": 0.00011805446043825068, + "loss": 0.8721, + "mean_token_accuracy": 0.7430652916431427, + "num_tokens": 103277093.0, + "step": 44690 + }, + { + "epoch": 0.4098285504721738, + "learning_rate": 0.00011803612359035483, + "loss": 0.8292, + "mean_token_accuracy": 0.7504394054412842, + "num_tokens": 103300286.0, + "step": 44700 + }, + { + "epoch": 0.40992023471165306, + "learning_rate": 0.00011801778674245899, + "loss": 0.8309, + "mean_token_accuracy": 0.7491260170936584, + "num_tokens": 103323115.0, + "step": 44710 + }, + { + "epoch": 0.4100119189511323, + "learning_rate": 0.00011799944989456312, + "loss": 0.8484, + "mean_token_accuracy": 0.743862408399582, + "num_tokens": 103346547.0, + "step": 44720 + }, + { + "epoch": 0.4101036031906115, + "learning_rate": 0.00011798111304666728, + "loss": 0.8344, + "mean_token_accuracy": 0.7455031991004943, + "num_tokens": 103369733.0, + "step": 44730 + }, + { + "epoch": 0.41019528743009076, + "learning_rate": 0.00011796277619877143, + "loss": 0.8236, + "mean_token_accuracy": 0.75127472281456, + "num_tokens": 103393322.0, + "step": 44740 + }, + { + "epoch": 0.41028697166957, + "learning_rate": 0.00011794443935087558, + "loss": 0.84, + "mean_token_accuracy": 0.7439639151096344, + "num_tokens": 103416118.0, + "step": 44750 + }, + { + "epoch": 0.41037865590904926, + "learning_rate": 0.00011792610250297975, + "loss": 0.8613, + "mean_token_accuracy": 0.7476392447948456, + "num_tokens": 103438843.0, + "step": 44760 + }, + { + "epoch": 0.41047034014852846, + "learning_rate": 0.0001179077656550839, + "loss": 0.8525, + "mean_token_accuracy": 0.7453845322132111, + "num_tokens": 103461877.0, + "step": 44770 + }, + { + "epoch": 0.4105620243880077, + "learning_rate": 0.00011788942880718805, + "loss": 0.862, + "mean_token_accuracy": 0.7461943209171296, + "num_tokens": 103484793.0, + "step": 44780 + }, + { + "epoch": 0.41065370862748696, + "learning_rate": 0.0001178710919592922, + "loss": 0.8315, + "mean_token_accuracy": 0.7418680310249328, + "num_tokens": 103507457.0, + "step": 44790 + }, + { + "epoch": 0.41074539286696615, + "learning_rate": 0.00011785275511139635, + "loss": 0.8606, + "mean_token_accuracy": 0.7420167028903961, + "num_tokens": 103530696.0, + "step": 44800 + }, + { + "epoch": 0.4108370771064454, + "learning_rate": 0.0001178344182635005, + "loss": 0.843, + "mean_token_accuracy": 0.7444317817687989, + "num_tokens": 103554093.0, + "step": 44810 + }, + { + "epoch": 0.41092876134592465, + "learning_rate": 0.00011781608141560467, + "loss": 0.8196, + "mean_token_accuracy": 0.7494815468788147, + "num_tokens": 103577543.0, + "step": 44820 + }, + { + "epoch": 0.41102044558540385, + "learning_rate": 0.00011779774456770882, + "loss": 0.8898, + "mean_token_accuracy": 0.7315061092376709, + "num_tokens": 103600184.0, + "step": 44830 + }, + { + "epoch": 0.4111121298248831, + "learning_rate": 0.00011777940771981297, + "loss": 0.8826, + "mean_token_accuracy": 0.7381754636764526, + "num_tokens": 103622962.0, + "step": 44840 + }, + { + "epoch": 0.41120381406436235, + "learning_rate": 0.00011776107087191713, + "loss": 0.8139, + "mean_token_accuracy": 0.7545563101768493, + "num_tokens": 103646700.0, + "step": 44850 + }, + { + "epoch": 0.41129549830384154, + "learning_rate": 0.00011774273402402128, + "loss": 0.8044, + "mean_token_accuracy": 0.7531153202056885, + "num_tokens": 103669148.0, + "step": 44860 + }, + { + "epoch": 0.4113871825433208, + "learning_rate": 0.00011772439717612542, + "loss": 0.8984, + "mean_token_accuracy": 0.7359162330627441, + "num_tokens": 103692313.0, + "step": 44870 + }, + { + "epoch": 0.41147886678280005, + "learning_rate": 0.00011770606032822957, + "loss": 0.8649, + "mean_token_accuracy": 0.7378570258617401, + "num_tokens": 103714806.0, + "step": 44880 + }, + { + "epoch": 0.4115705510222793, + "learning_rate": 0.00011768772348033375, + "loss": 0.833, + "mean_token_accuracy": 0.7548257350921631, + "num_tokens": 103737699.0, + "step": 44890 + }, + { + "epoch": 0.4116622352617585, + "learning_rate": 0.0001176693866324379, + "loss": 0.809, + "mean_token_accuracy": 0.7526199340820312, + "num_tokens": 103760162.0, + "step": 44900 + }, + { + "epoch": 0.41175391950123774, + "learning_rate": 0.00011765104978454205, + "loss": 0.8173, + "mean_token_accuracy": 0.7497694373130799, + "num_tokens": 103782907.0, + "step": 44910 + }, + { + "epoch": 0.411845603740717, + "learning_rate": 0.00011763271293664619, + "loss": 0.8624, + "mean_token_accuracy": 0.740943992137909, + "num_tokens": 103804971.0, + "step": 44920 + }, + { + "epoch": 0.4119372879801962, + "learning_rate": 0.00011761437608875034, + "loss": 0.8649, + "mean_token_accuracy": 0.736336624622345, + "num_tokens": 103828003.0, + "step": 44930 + }, + { + "epoch": 0.41202897221967544, + "learning_rate": 0.00011759603924085449, + "loss": 0.8648, + "mean_token_accuracy": 0.7434169828891755, + "num_tokens": 103850733.0, + "step": 44940 + }, + { + "epoch": 0.4121206564591547, + "learning_rate": 0.00011757770239295867, + "loss": 0.8416, + "mean_token_accuracy": 0.7394767940044403, + "num_tokens": 103873738.0, + "step": 44950 + }, + { + "epoch": 0.4122123406986339, + "learning_rate": 0.00011755936554506281, + "loss": 0.8332, + "mean_token_accuracy": 0.7482432544231414, + "num_tokens": 103897402.0, + "step": 44960 + }, + { + "epoch": 0.41230402493811313, + "learning_rate": 0.00011754102869716696, + "loss": 0.8512, + "mean_token_accuracy": 0.7492608785629272, + "num_tokens": 103919812.0, + "step": 44970 + }, + { + "epoch": 0.4123957091775924, + "learning_rate": 0.00011752269184927111, + "loss": 0.8331, + "mean_token_accuracy": 0.7446746230125427, + "num_tokens": 103943004.0, + "step": 44980 + }, + { + "epoch": 0.4124873934170716, + "learning_rate": 0.00011750435500137527, + "loss": 0.8453, + "mean_token_accuracy": 0.742868846654892, + "num_tokens": 103966092.0, + "step": 44990 + }, + { + "epoch": 0.41257907765655083, + "learning_rate": 0.00011748601815347942, + "loss": 0.8425, + "mean_token_accuracy": 0.7450195848941803, + "num_tokens": 103988479.0, + "step": 45000 + }, + { + "epoch": 0.4126707618960301, + "learning_rate": 0.00011746768130558357, + "loss": 0.8052, + "mean_token_accuracy": 0.7531399846076965, + "num_tokens": 104012140.0, + "step": 45010 + }, + { + "epoch": 0.41276244613550933, + "learning_rate": 0.00011744934445768774, + "loss": 0.8481, + "mean_token_accuracy": 0.7497302830219269, + "num_tokens": 104035348.0, + "step": 45020 + }, + { + "epoch": 0.4128541303749885, + "learning_rate": 0.00011743100760979189, + "loss": 0.8753, + "mean_token_accuracy": 0.7362090647220612, + "num_tokens": 104058566.0, + "step": 45030 + }, + { + "epoch": 0.4129458146144678, + "learning_rate": 0.00011741267076189604, + "loss": 0.8406, + "mean_token_accuracy": 0.7523486912250519, + "num_tokens": 104081960.0, + "step": 45040 + }, + { + "epoch": 0.413037498853947, + "learning_rate": 0.00011739433391400019, + "loss": 0.8669, + "mean_token_accuracy": 0.7415791153907776, + "num_tokens": 104104438.0, + "step": 45050 + }, + { + "epoch": 0.4131291830934262, + "learning_rate": 0.00011737599706610434, + "loss": 0.8777, + "mean_token_accuracy": 0.7370117008686066, + "num_tokens": 104127169.0, + "step": 45060 + }, + { + "epoch": 0.4132208673329055, + "learning_rate": 0.00011735766021820848, + "loss": 0.857, + "mean_token_accuracy": 0.7467028617858886, + "num_tokens": 104149718.0, + "step": 45070 + }, + { + "epoch": 0.4133125515723847, + "learning_rate": 0.00011733932337031266, + "loss": 0.8588, + "mean_token_accuracy": 0.7402410984039307, + "num_tokens": 104172687.0, + "step": 45080 + }, + { + "epoch": 0.4134042358118639, + "learning_rate": 0.00011732098652241681, + "loss": 0.868, + "mean_token_accuracy": 0.7320907115936279, + "num_tokens": 104195917.0, + "step": 45090 + }, + { + "epoch": 0.41349592005134317, + "learning_rate": 0.00011730264967452096, + "loss": 0.8508, + "mean_token_accuracy": 0.7465797960758209, + "num_tokens": 104218361.0, + "step": 45100 + }, + { + "epoch": 0.4135876042908224, + "learning_rate": 0.00011728431282662512, + "loss": 0.8551, + "mean_token_accuracy": 0.74462109208107, + "num_tokens": 104241534.0, + "step": 45110 + }, + { + "epoch": 0.4136792885303016, + "learning_rate": 0.00011726597597872925, + "loss": 0.8565, + "mean_token_accuracy": 0.7477043271064758, + "num_tokens": 104263476.0, + "step": 45120 + }, + { + "epoch": 0.41377097276978086, + "learning_rate": 0.0001172476391308334, + "loss": 0.8724, + "mean_token_accuracy": 0.7380394160747528, + "num_tokens": 104286942.0, + "step": 45130 + }, + { + "epoch": 0.4138626570092601, + "learning_rate": 0.00011722930228293756, + "loss": 0.8499, + "mean_token_accuracy": 0.7433103680610657, + "num_tokens": 104310207.0, + "step": 45140 + }, + { + "epoch": 0.41395434124873937, + "learning_rate": 0.00011721096543504174, + "loss": 0.8315, + "mean_token_accuracy": 0.748098623752594, + "num_tokens": 104333051.0, + "step": 45150 + }, + { + "epoch": 0.41404602548821856, + "learning_rate": 0.00011719262858714587, + "loss": 0.8639, + "mean_token_accuracy": 0.7461417078971863, + "num_tokens": 104357050.0, + "step": 45160 + }, + { + "epoch": 0.4141377097276978, + "learning_rate": 0.00011717429173925003, + "loss": 0.873, + "mean_token_accuracy": 0.7391665399074554, + "num_tokens": 104379551.0, + "step": 45170 + }, + { + "epoch": 0.41422939396717706, + "learning_rate": 0.00011715595489135418, + "loss": 0.8391, + "mean_token_accuracy": 0.7471110463142395, + "num_tokens": 104404067.0, + "step": 45180 + }, + { + "epoch": 0.41432107820665626, + "learning_rate": 0.00011713761804345833, + "loss": 0.8575, + "mean_token_accuracy": 0.744124048948288, + "num_tokens": 104427315.0, + "step": 45190 + }, + { + "epoch": 0.4144127624461355, + "learning_rate": 0.00011711928119556248, + "loss": 0.8241, + "mean_token_accuracy": 0.7467672049999237, + "num_tokens": 104450719.0, + "step": 45200 + }, + { + "epoch": 0.41450444668561476, + "learning_rate": 0.00011710094434766665, + "loss": 0.8226, + "mean_token_accuracy": 0.7560986161231995, + "num_tokens": 104474191.0, + "step": 45210 + }, + { + "epoch": 0.41459613092509395, + "learning_rate": 0.0001170826074997708, + "loss": 0.8484, + "mean_token_accuracy": 0.7443042755126953, + "num_tokens": 104497735.0, + "step": 45220 + }, + { + "epoch": 0.4146878151645732, + "learning_rate": 0.00011706427065187495, + "loss": 0.8714, + "mean_token_accuracy": 0.7403197705745697, + "num_tokens": 104520274.0, + "step": 45230 + }, + { + "epoch": 0.41477949940405245, + "learning_rate": 0.0001170459338039791, + "loss": 0.8774, + "mean_token_accuracy": 0.7455156743526459, + "num_tokens": 104543077.0, + "step": 45240 + }, + { + "epoch": 0.4148711836435317, + "learning_rate": 0.00011702759695608326, + "loss": 0.8405, + "mean_token_accuracy": 0.7446125626564026, + "num_tokens": 104566045.0, + "step": 45250 + }, + { + "epoch": 0.4149628678830109, + "learning_rate": 0.00011700926010818741, + "loss": 0.8182, + "mean_token_accuracy": 0.7474395215511322, + "num_tokens": 104588489.0, + "step": 45260 + }, + { + "epoch": 0.41505455212249015, + "learning_rate": 0.00011699092326029155, + "loss": 0.864, + "mean_token_accuracy": 0.7484601020812989, + "num_tokens": 104611950.0, + "step": 45270 + }, + { + "epoch": 0.4151462363619694, + "learning_rate": 0.00011697258641239572, + "loss": 0.8277, + "mean_token_accuracy": 0.7526186227798461, + "num_tokens": 104635604.0, + "step": 45280 + }, + { + "epoch": 0.4152379206014486, + "learning_rate": 0.00011695424956449988, + "loss": 0.8319, + "mean_token_accuracy": 0.7496239125728608, + "num_tokens": 104658393.0, + "step": 45290 + }, + { + "epoch": 0.41532960484092785, + "learning_rate": 0.00011693591271660403, + "loss": 0.8414, + "mean_token_accuracy": 0.7488942444324493, + "num_tokens": 104681563.0, + "step": 45300 + }, + { + "epoch": 0.4154212890804071, + "learning_rate": 0.00011691757586870818, + "loss": 0.8186, + "mean_token_accuracy": 0.7454311132431031, + "num_tokens": 104705044.0, + "step": 45310 + }, + { + "epoch": 0.4155129733198863, + "learning_rate": 0.00011689923902081232, + "loss": 0.8472, + "mean_token_accuracy": 0.7493055939674378, + "num_tokens": 104727656.0, + "step": 45320 + }, + { + "epoch": 0.41560465755936554, + "learning_rate": 0.00011688090217291647, + "loss": 0.8314, + "mean_token_accuracy": 0.74879270195961, + "num_tokens": 104751145.0, + "step": 45330 + }, + { + "epoch": 0.4156963417988448, + "learning_rate": 0.00011686256532502065, + "loss": 0.8336, + "mean_token_accuracy": 0.7552003026008606, + "num_tokens": 104774820.0, + "step": 45340 + }, + { + "epoch": 0.415788026038324, + "learning_rate": 0.0001168442284771248, + "loss": 0.8507, + "mean_token_accuracy": 0.748703908920288, + "num_tokens": 104797916.0, + "step": 45350 + }, + { + "epoch": 0.41587971027780324, + "learning_rate": 0.00011682589162922894, + "loss": 0.8563, + "mean_token_accuracy": 0.7438113152980804, + "num_tokens": 104821565.0, + "step": 45360 + }, + { + "epoch": 0.4159713945172825, + "learning_rate": 0.00011680755478133309, + "loss": 0.8423, + "mean_token_accuracy": 0.7446358323097229, + "num_tokens": 104845272.0, + "step": 45370 + }, + { + "epoch": 0.41606307875676174, + "learning_rate": 0.00011678921793343724, + "loss": 0.8141, + "mean_token_accuracy": 0.7505999803543091, + "num_tokens": 104868137.0, + "step": 45380 + }, + { + "epoch": 0.41615476299624093, + "learning_rate": 0.0001167708810855414, + "loss": 0.8547, + "mean_token_accuracy": 0.7448664903640747, + "num_tokens": 104892107.0, + "step": 45390 + }, + { + "epoch": 0.4162464472357202, + "learning_rate": 0.00011675254423764555, + "loss": 0.8255, + "mean_token_accuracy": 0.7546456217765808, + "num_tokens": 104915193.0, + "step": 45400 + }, + { + "epoch": 0.41633813147519944, + "learning_rate": 0.00011673420738974971, + "loss": 0.8628, + "mean_token_accuracy": 0.7427400827407837, + "num_tokens": 104937698.0, + "step": 45410 + }, + { + "epoch": 0.41642981571467863, + "learning_rate": 0.00011671587054185386, + "loss": 0.8295, + "mean_token_accuracy": 0.7500802636146545, + "num_tokens": 104960515.0, + "step": 45420 + }, + { + "epoch": 0.4165214999541579, + "learning_rate": 0.00011669753369395802, + "loss": 0.8087, + "mean_token_accuracy": 0.7531710028648376, + "num_tokens": 104984037.0, + "step": 45430 + }, + { + "epoch": 0.41661318419363713, + "learning_rate": 0.00011667919684606217, + "loss": 0.8506, + "mean_token_accuracy": 0.7413691818714142, + "num_tokens": 105007977.0, + "step": 45440 + }, + { + "epoch": 0.4167048684331163, + "learning_rate": 0.00011666085999816632, + "loss": 0.8368, + "mean_token_accuracy": 0.7456383883953095, + "num_tokens": 105031155.0, + "step": 45450 + }, + { + "epoch": 0.4167965526725956, + "learning_rate": 0.00011664252315027047, + "loss": 0.8203, + "mean_token_accuracy": 0.7559475481510163, + "num_tokens": 105054640.0, + "step": 45460 + }, + { + "epoch": 0.4168882369120748, + "learning_rate": 0.00011662418630237464, + "loss": 0.8705, + "mean_token_accuracy": 0.7432197690010071, + "num_tokens": 105077830.0, + "step": 45470 + }, + { + "epoch": 0.416979921151554, + "learning_rate": 0.00011660584945447879, + "loss": 0.8142, + "mean_token_accuracy": 0.7596755623817444, + "num_tokens": 105100700.0, + "step": 45480 + }, + { + "epoch": 0.4170716053910333, + "learning_rate": 0.00011658751260658294, + "loss": 0.812, + "mean_token_accuracy": 0.7577692210674286, + "num_tokens": 105123057.0, + "step": 45490 + }, + { + "epoch": 0.4171632896305125, + "learning_rate": 0.00011656917575868709, + "loss": 0.8562, + "mean_token_accuracy": 0.7477727413177491, + "num_tokens": 105146667.0, + "step": 45500 + }, + { + "epoch": 0.4172549738699918, + "learning_rate": 0.00011655083891079124, + "loss": 0.8796, + "mean_token_accuracy": 0.7398671507835388, + "num_tokens": 105169653.0, + "step": 45510 + }, + { + "epoch": 0.41734665810947097, + "learning_rate": 0.00011653250206289538, + "loss": 0.8182, + "mean_token_accuracy": 0.7536071181297302, + "num_tokens": 105193215.0, + "step": 45520 + }, + { + "epoch": 0.4174383423489502, + "learning_rate": 0.00011651416521499953, + "loss": 0.8194, + "mean_token_accuracy": 0.7570696473121643, + "num_tokens": 105216210.0, + "step": 45530 + }, + { + "epoch": 0.41753002658842947, + "learning_rate": 0.00011649582836710371, + "loss": 0.8548, + "mean_token_accuracy": 0.7465242505073547, + "num_tokens": 105239689.0, + "step": 45540 + }, + { + "epoch": 0.41762171082790867, + "learning_rate": 0.00011647749151920787, + "loss": 0.8469, + "mean_token_accuracy": 0.75292107462883, + "num_tokens": 105262978.0, + "step": 45550 + }, + { + "epoch": 0.4177133950673879, + "learning_rate": 0.000116459154671312, + "loss": 0.8722, + "mean_token_accuracy": 0.7375808358192444, + "num_tokens": 105287163.0, + "step": 45560 + }, + { + "epoch": 0.41780507930686717, + "learning_rate": 0.00011644081782341616, + "loss": 0.8894, + "mean_token_accuracy": 0.7363746345043183, + "num_tokens": 105310174.0, + "step": 45570 + }, + { + "epoch": 0.41789676354634636, + "learning_rate": 0.00011642248097552031, + "loss": 0.8305, + "mean_token_accuracy": 0.7463148236274719, + "num_tokens": 105333603.0, + "step": 45580 + }, + { + "epoch": 0.4179884477858256, + "learning_rate": 0.00011640414412762446, + "loss": 0.8357, + "mean_token_accuracy": 0.7453543424606324, + "num_tokens": 105356793.0, + "step": 45590 + }, + { + "epoch": 0.41808013202530486, + "learning_rate": 0.00011638580727972861, + "loss": 0.8456, + "mean_token_accuracy": 0.7480204463005066, + "num_tokens": 105379835.0, + "step": 45600 + }, + { + "epoch": 0.41817181626478406, + "learning_rate": 0.00011636747043183278, + "loss": 0.8423, + "mean_token_accuracy": 0.7426742017269135, + "num_tokens": 105403266.0, + "step": 45610 + }, + { + "epoch": 0.4182635005042633, + "learning_rate": 0.00011634913358393693, + "loss": 0.8317, + "mean_token_accuracy": 0.7503256618976593, + "num_tokens": 105425953.0, + "step": 45620 + }, + { + "epoch": 0.41835518474374256, + "learning_rate": 0.00011633079673604108, + "loss": 0.8778, + "mean_token_accuracy": 0.7438302993774414, + "num_tokens": 105447892.0, + "step": 45630 + }, + { + "epoch": 0.4184468689832218, + "learning_rate": 0.00011631245988814523, + "loss": 0.8788, + "mean_token_accuracy": 0.7388303697109222, + "num_tokens": 105470830.0, + "step": 45640 + }, + { + "epoch": 0.418538553222701, + "learning_rate": 0.00011629412304024938, + "loss": 0.8189, + "mean_token_accuracy": 0.750828355550766, + "num_tokens": 105493417.0, + "step": 45650 + }, + { + "epoch": 0.41863023746218025, + "learning_rate": 0.00011627578619235354, + "loss": 0.8262, + "mean_token_accuracy": 0.7559551656246185, + "num_tokens": 105516431.0, + "step": 45660 + }, + { + "epoch": 0.4187219217016595, + "learning_rate": 0.0001162574493444577, + "loss": 0.8126, + "mean_token_accuracy": 0.752439683675766, + "num_tokens": 105539949.0, + "step": 45670 + }, + { + "epoch": 0.4188136059411387, + "learning_rate": 0.00011623911249656185, + "loss": 0.8461, + "mean_token_accuracy": 0.7447866261005401, + "num_tokens": 105564062.0, + "step": 45680 + }, + { + "epoch": 0.41890529018061795, + "learning_rate": 0.000116220775648666, + "loss": 0.8596, + "mean_token_accuracy": 0.7445887506008149, + "num_tokens": 105587012.0, + "step": 45690 + }, + { + "epoch": 0.4189969744200972, + "learning_rate": 0.00011620243880077016, + "loss": 0.8744, + "mean_token_accuracy": 0.7401760339736938, + "num_tokens": 105610455.0, + "step": 45700 + }, + { + "epoch": 0.4190886586595764, + "learning_rate": 0.00011618410195287431, + "loss": 0.8279, + "mean_token_accuracy": 0.7462787568569184, + "num_tokens": 105632633.0, + "step": 45710 + }, + { + "epoch": 0.41918034289905565, + "learning_rate": 0.00011616576510497845, + "loss": 0.8732, + "mean_token_accuracy": 0.7452632546424866, + "num_tokens": 105656151.0, + "step": 45720 + }, + { + "epoch": 0.4192720271385349, + "learning_rate": 0.0001161474282570826, + "loss": 0.8808, + "mean_token_accuracy": 0.7367396593093872, + "num_tokens": 105679462.0, + "step": 45730 + }, + { + "epoch": 0.4193637113780141, + "learning_rate": 0.00011612909140918678, + "loss": 0.829, + "mean_token_accuracy": 0.7499977886676789, + "num_tokens": 105702901.0, + "step": 45740 + }, + { + "epoch": 0.41945539561749334, + "learning_rate": 0.00011611075456129093, + "loss": 0.7976, + "mean_token_accuracy": 0.7562902629375458, + "num_tokens": 105726473.0, + "step": 45750 + }, + { + "epoch": 0.4195470798569726, + "learning_rate": 0.00011609241771339507, + "loss": 0.8624, + "mean_token_accuracy": 0.7390582978725433, + "num_tokens": 105749821.0, + "step": 45760 + }, + { + "epoch": 0.41963876409645184, + "learning_rate": 0.00011607408086549922, + "loss": 0.8321, + "mean_token_accuracy": 0.7496195077896118, + "num_tokens": 105773048.0, + "step": 45770 + }, + { + "epoch": 0.41973044833593104, + "learning_rate": 0.00011605574401760337, + "loss": 0.8469, + "mean_token_accuracy": 0.7463629901409149, + "num_tokens": 105796028.0, + "step": 45780 + }, + { + "epoch": 0.4198221325754103, + "learning_rate": 0.00011603740716970752, + "loss": 0.8727, + "mean_token_accuracy": 0.7390254437923431, + "num_tokens": 105819424.0, + "step": 45790 + }, + { + "epoch": 0.41991381681488954, + "learning_rate": 0.00011601907032181169, + "loss": 0.8553, + "mean_token_accuracy": 0.7427088797092438, + "num_tokens": 105842506.0, + "step": 45800 + }, + { + "epoch": 0.42000550105436874, + "learning_rate": 0.00011600073347391584, + "loss": 0.8335, + "mean_token_accuracy": 0.7487434446811676, + "num_tokens": 105865914.0, + "step": 45810 + }, + { + "epoch": 0.420097185293848, + "learning_rate": 0.00011598239662601999, + "loss": 0.8925, + "mean_token_accuracy": 0.7376970946788788, + "num_tokens": 105889179.0, + "step": 45820 + }, + { + "epoch": 0.42018886953332724, + "learning_rate": 0.00011596405977812414, + "loss": 0.7837, + "mean_token_accuracy": 0.7546100616455078, + "num_tokens": 105912235.0, + "step": 45830 + }, + { + "epoch": 0.42028055377280643, + "learning_rate": 0.0001159457229302283, + "loss": 0.8801, + "mean_token_accuracy": 0.7406101167201996, + "num_tokens": 105935843.0, + "step": 45840 + }, + { + "epoch": 0.4203722380122857, + "learning_rate": 0.00011592738608233245, + "loss": 0.8263, + "mean_token_accuracy": 0.750576651096344, + "num_tokens": 105959465.0, + "step": 45850 + }, + { + "epoch": 0.42046392225176493, + "learning_rate": 0.0001159090492344366, + "loss": 0.8815, + "mean_token_accuracy": 0.7370054364204407, + "num_tokens": 105983307.0, + "step": 45860 + }, + { + "epoch": 0.4205556064912442, + "learning_rate": 0.00011589071238654077, + "loss": 0.8643, + "mean_token_accuracy": 0.7418716788291931, + "num_tokens": 106006639.0, + "step": 45870 + }, + { + "epoch": 0.4206472907307234, + "learning_rate": 0.00011587237553864492, + "loss": 0.8715, + "mean_token_accuracy": 0.7429073452949524, + "num_tokens": 106029369.0, + "step": 45880 + }, + { + "epoch": 0.42073897497020263, + "learning_rate": 0.00011585403869074907, + "loss": 0.8253, + "mean_token_accuracy": 0.7510428845882415, + "num_tokens": 106052040.0, + "step": 45890 + }, + { + "epoch": 0.4208306592096819, + "learning_rate": 0.00011583570184285322, + "loss": 0.8779, + "mean_token_accuracy": 0.7394703567028046, + "num_tokens": 106075073.0, + "step": 45900 + }, + { + "epoch": 0.4209223434491611, + "learning_rate": 0.00011581736499495737, + "loss": 0.8392, + "mean_token_accuracy": 0.7552196383476257, + "num_tokens": 106098575.0, + "step": 45910 + }, + { + "epoch": 0.4210140276886403, + "learning_rate": 0.00011579902814706151, + "loss": 0.8484, + "mean_token_accuracy": 0.7435707151889801, + "num_tokens": 106121685.0, + "step": 45920 + }, + { + "epoch": 0.4211057119281196, + "learning_rate": 0.00011578069129916569, + "loss": 0.8587, + "mean_token_accuracy": 0.7399836182594299, + "num_tokens": 106144497.0, + "step": 45930 + }, + { + "epoch": 0.42119739616759877, + "learning_rate": 0.00011576235445126984, + "loss": 0.8864, + "mean_token_accuracy": 0.7383939027786255, + "num_tokens": 106167585.0, + "step": 45940 + }, + { + "epoch": 0.421289080407078, + "learning_rate": 0.000115744017603374, + "loss": 0.8677, + "mean_token_accuracy": 0.7396584928035737, + "num_tokens": 106190120.0, + "step": 45950 + }, + { + "epoch": 0.42138076464655727, + "learning_rate": 0.00011572568075547813, + "loss": 0.8402, + "mean_token_accuracy": 0.7479067862033844, + "num_tokens": 106212767.0, + "step": 45960 + }, + { + "epoch": 0.42147244888603647, + "learning_rate": 0.00011570734390758228, + "loss": 0.8778, + "mean_token_accuracy": 0.7405851066112519, + "num_tokens": 106234721.0, + "step": 45970 + }, + { + "epoch": 0.4215641331255157, + "learning_rate": 0.00011568900705968644, + "loss": 0.8936, + "mean_token_accuracy": 0.7409386932849884, + "num_tokens": 106257402.0, + "step": 45980 + }, + { + "epoch": 0.42165581736499497, + "learning_rate": 0.00011567067021179059, + "loss": 0.8444, + "mean_token_accuracy": 0.7518729507923126, + "num_tokens": 106280272.0, + "step": 45990 + }, + { + "epoch": 0.4217475016044742, + "learning_rate": 0.00011565233336389475, + "loss": 0.8635, + "mean_token_accuracy": 0.7428579866886139, + "num_tokens": 106303374.0, + "step": 46000 + }, + { + "epoch": 0.4218391858439534, + "learning_rate": 0.0001156339965159989, + "loss": 0.8603, + "mean_token_accuracy": 0.7387055456638336, + "num_tokens": 106326608.0, + "step": 46010 + }, + { + "epoch": 0.42193087008343266, + "learning_rate": 0.00011561565966810306, + "loss": 0.8602, + "mean_token_accuracy": 0.7429966807365418, + "num_tokens": 106350235.0, + "step": 46020 + }, + { + "epoch": 0.4220225543229119, + "learning_rate": 0.00011559732282020721, + "loss": 0.8423, + "mean_token_accuracy": 0.7473647713661193, + "num_tokens": 106373390.0, + "step": 46030 + }, + { + "epoch": 0.4221142385623911, + "learning_rate": 0.00011557898597231136, + "loss": 0.8421, + "mean_token_accuracy": 0.7498080492019653, + "num_tokens": 106397098.0, + "step": 46040 + }, + { + "epoch": 0.42220592280187036, + "learning_rate": 0.00011556064912441551, + "loss": 0.8412, + "mean_token_accuracy": 0.7453709840774536, + "num_tokens": 106420285.0, + "step": 46050 + }, + { + "epoch": 0.4222976070413496, + "learning_rate": 0.00011554231227651968, + "loss": 0.8463, + "mean_token_accuracy": 0.7433944940567017, + "num_tokens": 106442894.0, + "step": 46060 + }, + { + "epoch": 0.4223892912808288, + "learning_rate": 0.00011552397542862383, + "loss": 0.8824, + "mean_token_accuracy": 0.7417986690998077, + "num_tokens": 106465957.0, + "step": 46070 + }, + { + "epoch": 0.42248097552030806, + "learning_rate": 0.00011550563858072798, + "loss": 0.8672, + "mean_token_accuracy": 0.7395024836063385, + "num_tokens": 106488880.0, + "step": 46080 + }, + { + "epoch": 0.4225726597597873, + "learning_rate": 0.00011548730173283213, + "loss": 0.8664, + "mean_token_accuracy": 0.7445531606674194, + "num_tokens": 106512511.0, + "step": 46090 + }, + { + "epoch": 0.4226643439992665, + "learning_rate": 0.00011546896488493629, + "loss": 0.8571, + "mean_token_accuracy": 0.7428897380828857, + "num_tokens": 106536804.0, + "step": 46100 + }, + { + "epoch": 0.42275602823874575, + "learning_rate": 0.00011545062803704044, + "loss": 0.8638, + "mean_token_accuracy": 0.7499698102474213, + "num_tokens": 106559217.0, + "step": 46110 + }, + { + "epoch": 0.422847712478225, + "learning_rate": 0.00011543229118914458, + "loss": 0.8661, + "mean_token_accuracy": 0.738968962430954, + "num_tokens": 106582047.0, + "step": 46120 + }, + { + "epoch": 0.42293939671770425, + "learning_rate": 0.00011541395434124876, + "loss": 0.8288, + "mean_token_accuracy": 0.7504612803459167, + "num_tokens": 106605527.0, + "step": 46130 + }, + { + "epoch": 0.42303108095718345, + "learning_rate": 0.00011539561749335291, + "loss": 0.8498, + "mean_token_accuracy": 0.7508462846279145, + "num_tokens": 106628365.0, + "step": 46140 + }, + { + "epoch": 0.4231227651966627, + "learning_rate": 0.00011537728064545706, + "loss": 0.8522, + "mean_token_accuracy": 0.748188054561615, + "num_tokens": 106652326.0, + "step": 46150 + }, + { + "epoch": 0.42321444943614195, + "learning_rate": 0.0001153589437975612, + "loss": 0.8356, + "mean_token_accuracy": 0.7493544459342957, + "num_tokens": 106675436.0, + "step": 46160 + }, + { + "epoch": 0.42330613367562114, + "learning_rate": 0.00011534060694966535, + "loss": 0.8426, + "mean_token_accuracy": 0.7411046922206879, + "num_tokens": 106698878.0, + "step": 46170 + }, + { + "epoch": 0.4233978179151004, + "learning_rate": 0.0001153222701017695, + "loss": 0.8772, + "mean_token_accuracy": 0.7387505054473877, + "num_tokens": 106721574.0, + "step": 46180 + }, + { + "epoch": 0.42348950215457964, + "learning_rate": 0.00011530393325387368, + "loss": 0.8331, + "mean_token_accuracy": 0.7473115742206573, + "num_tokens": 106744381.0, + "step": 46190 + }, + { + "epoch": 0.42358118639405884, + "learning_rate": 0.00011528559640597782, + "loss": 0.8495, + "mean_token_accuracy": 0.7447142958641052, + "num_tokens": 106767371.0, + "step": 46200 + }, + { + "epoch": 0.4236728706335381, + "learning_rate": 0.00011526725955808197, + "loss": 0.8427, + "mean_token_accuracy": 0.750130033493042, + "num_tokens": 106790745.0, + "step": 46210 + }, + { + "epoch": 0.42376455487301734, + "learning_rate": 0.00011524892271018612, + "loss": 0.8542, + "mean_token_accuracy": 0.7497813165187835, + "num_tokens": 106814397.0, + "step": 46220 + }, + { + "epoch": 0.42385623911249654, + "learning_rate": 0.00011523058586229027, + "loss": 0.8386, + "mean_token_accuracy": 0.7483627617359161, + "num_tokens": 106837580.0, + "step": 46230 + }, + { + "epoch": 0.4239479233519758, + "learning_rate": 0.00011521224901439443, + "loss": 0.8055, + "mean_token_accuracy": 0.753358781337738, + "num_tokens": 106860740.0, + "step": 46240 + }, + { + "epoch": 0.42403960759145504, + "learning_rate": 0.00011519391216649858, + "loss": 0.835, + "mean_token_accuracy": 0.751039469242096, + "num_tokens": 106883649.0, + "step": 46250 + }, + { + "epoch": 0.4241312918309343, + "learning_rate": 0.00011517557531860274, + "loss": 0.8451, + "mean_token_accuracy": 0.7448641002178192, + "num_tokens": 106906797.0, + "step": 46260 + }, + { + "epoch": 0.4242229760704135, + "learning_rate": 0.0001151572384707069, + "loss": 0.8388, + "mean_token_accuracy": 0.7540587186813354, + "num_tokens": 106929867.0, + "step": 46270 + }, + { + "epoch": 0.42431466030989273, + "learning_rate": 0.00011513890162281105, + "loss": 0.8636, + "mean_token_accuracy": 0.7385248601436615, + "num_tokens": 106952653.0, + "step": 46280 + }, + { + "epoch": 0.424406344549372, + "learning_rate": 0.0001151205647749152, + "loss": 0.8113, + "mean_token_accuracy": 0.7544450163841248, + "num_tokens": 106975920.0, + "step": 46290 + }, + { + "epoch": 0.4244980287888512, + "learning_rate": 0.00011510222792701935, + "loss": 0.8078, + "mean_token_accuracy": 0.7519317746162415, + "num_tokens": 106998058.0, + "step": 46300 + }, + { + "epoch": 0.42458971302833043, + "learning_rate": 0.0001150838910791235, + "loss": 0.8371, + "mean_token_accuracy": 0.7469861268997192, + "num_tokens": 107021147.0, + "step": 46310 + }, + { + "epoch": 0.4246813972678097, + "learning_rate": 0.00011506555423122767, + "loss": 0.7939, + "mean_token_accuracy": 0.754490852355957, + "num_tokens": 107045031.0, + "step": 46320 + }, + { + "epoch": 0.4247730815072889, + "learning_rate": 0.00011504721738333182, + "loss": 0.862, + "mean_token_accuracy": 0.7441570162773132, + "num_tokens": 107068091.0, + "step": 46330 + }, + { + "epoch": 0.4248647657467681, + "learning_rate": 0.00011502888053543597, + "loss": 0.8453, + "mean_token_accuracy": 0.7424165308475494, + "num_tokens": 107090966.0, + "step": 46340 + }, + { + "epoch": 0.4249564499862474, + "learning_rate": 0.00011501054368754012, + "loss": 0.8389, + "mean_token_accuracy": 0.7543610811233521, + "num_tokens": 107113144.0, + "step": 46350 + }, + { + "epoch": 0.42504813422572657, + "learning_rate": 0.00011499220683964426, + "loss": 0.8709, + "mean_token_accuracy": 0.7408024132251739, + "num_tokens": 107136129.0, + "step": 46360 + }, + { + "epoch": 0.4251398184652058, + "learning_rate": 0.00011497386999174841, + "loss": 0.8228, + "mean_token_accuracy": 0.7498598039150238, + "num_tokens": 107159147.0, + "step": 46370 + }, + { + "epoch": 0.42523150270468507, + "learning_rate": 0.00011495553314385257, + "loss": 0.8403, + "mean_token_accuracy": 0.7475099742412568, + "num_tokens": 107181963.0, + "step": 46380 + }, + { + "epoch": 0.4253231869441643, + "learning_rate": 0.00011493719629595674, + "loss": 0.8558, + "mean_token_accuracy": 0.7424833416938782, + "num_tokens": 107204721.0, + "step": 46390 + }, + { + "epoch": 0.4254148711836435, + "learning_rate": 0.00011491885944806088, + "loss": 0.8519, + "mean_token_accuracy": 0.7513519704341889, + "num_tokens": 107228509.0, + "step": 46400 + }, + { + "epoch": 0.42550655542312277, + "learning_rate": 0.00011490052260016503, + "loss": 0.8497, + "mean_token_accuracy": 0.7518217444419861, + "num_tokens": 107251226.0, + "step": 46410 + }, + { + "epoch": 0.425598239662602, + "learning_rate": 0.00011488218575226919, + "loss": 0.8638, + "mean_token_accuracy": 0.7468670606613159, + "num_tokens": 107273883.0, + "step": 46420 + }, + { + "epoch": 0.4256899239020812, + "learning_rate": 0.00011486384890437334, + "loss": 0.861, + "mean_token_accuracy": 0.7417753159999847, + "num_tokens": 107297263.0, + "step": 46430 + }, + { + "epoch": 0.42578160814156046, + "learning_rate": 0.00011484551205647749, + "loss": 0.8383, + "mean_token_accuracy": 0.7486030995845795, + "num_tokens": 107320290.0, + "step": 46440 + }, + { + "epoch": 0.4258732923810397, + "learning_rate": 0.00011482717520858166, + "loss": 0.8658, + "mean_token_accuracy": 0.7476086497306824, + "num_tokens": 107343053.0, + "step": 46450 + }, + { + "epoch": 0.4259649766205189, + "learning_rate": 0.00011480883836068581, + "loss": 0.8017, + "mean_token_accuracy": 0.75301753282547, + "num_tokens": 107365837.0, + "step": 46460 + }, + { + "epoch": 0.42605666085999816, + "learning_rate": 0.00011479050151278996, + "loss": 0.8494, + "mean_token_accuracy": 0.7412908494472503, + "num_tokens": 107388408.0, + "step": 46470 + }, + { + "epoch": 0.4261483450994774, + "learning_rate": 0.00011477216466489411, + "loss": 0.8784, + "mean_token_accuracy": 0.7370311617851257, + "num_tokens": 107411871.0, + "step": 46480 + }, + { + "epoch": 0.42624002933895666, + "learning_rate": 0.00011475382781699826, + "loss": 0.858, + "mean_token_accuracy": 0.7447152078151703, + "num_tokens": 107435014.0, + "step": 46490 + }, + { + "epoch": 0.42633171357843586, + "learning_rate": 0.00011473549096910241, + "loss": 0.8148, + "mean_token_accuracy": 0.7514746487140656, + "num_tokens": 107458939.0, + "step": 46500 + }, + { + "epoch": 0.4264233978179151, + "learning_rate": 0.00011471715412120657, + "loss": 0.865, + "mean_token_accuracy": 0.7420465648174286, + "num_tokens": 107482667.0, + "step": 46510 + }, + { + "epoch": 0.42651508205739436, + "learning_rate": 0.00011469881727331073, + "loss": 0.8504, + "mean_token_accuracy": 0.742823350429535, + "num_tokens": 107505392.0, + "step": 46520 + }, + { + "epoch": 0.42660676629687355, + "learning_rate": 0.00011468048042541488, + "loss": 0.8307, + "mean_token_accuracy": 0.7505095362663269, + "num_tokens": 107528397.0, + "step": 46530 + }, + { + "epoch": 0.4266984505363528, + "learning_rate": 0.00011466214357751904, + "loss": 0.8544, + "mean_token_accuracy": 0.7376496374607087, + "num_tokens": 107551304.0, + "step": 46540 + }, + { + "epoch": 0.42679013477583205, + "learning_rate": 0.00011464380672962319, + "loss": 0.844, + "mean_token_accuracy": 0.7526470005512238, + "num_tokens": 107575383.0, + "step": 46550 + }, + { + "epoch": 0.42688181901531125, + "learning_rate": 0.00011462546988172733, + "loss": 0.8477, + "mean_token_accuracy": 0.745954406261444, + "num_tokens": 107598795.0, + "step": 46560 + }, + { + "epoch": 0.4269735032547905, + "learning_rate": 0.00011460713303383148, + "loss": 0.8275, + "mean_token_accuracy": 0.752588552236557, + "num_tokens": 107622572.0, + "step": 46570 + }, + { + "epoch": 0.42706518749426975, + "learning_rate": 0.00011458879618593566, + "loss": 0.8334, + "mean_token_accuracy": 0.7562140345573425, + "num_tokens": 107645640.0, + "step": 46580 + }, + { + "epoch": 0.42715687173374894, + "learning_rate": 0.00011457045933803981, + "loss": 0.8255, + "mean_token_accuracy": 0.7416290700435638, + "num_tokens": 107667678.0, + "step": 46590 + }, + { + "epoch": 0.4272485559732282, + "learning_rate": 0.00011455212249014395, + "loss": 0.8682, + "mean_token_accuracy": 0.7378032803535461, + "num_tokens": 107690796.0, + "step": 46600 + }, + { + "epoch": 0.42734024021270745, + "learning_rate": 0.0001145337856422481, + "loss": 0.8114, + "mean_token_accuracy": 0.7644253432750702, + "num_tokens": 107713308.0, + "step": 46610 + }, + { + "epoch": 0.4274319244521867, + "learning_rate": 0.00011451544879435225, + "loss": 0.8479, + "mean_token_accuracy": 0.7421428322792053, + "num_tokens": 107735691.0, + "step": 46620 + }, + { + "epoch": 0.4275236086916659, + "learning_rate": 0.0001144971119464564, + "loss": 0.863, + "mean_token_accuracy": 0.7498755097389221, + "num_tokens": 107758652.0, + "step": 46630 + }, + { + "epoch": 0.42761529293114514, + "learning_rate": 0.00011447877509856055, + "loss": 0.8194, + "mean_token_accuracy": 0.7523223459720612, + "num_tokens": 107781493.0, + "step": 46640 + }, + { + "epoch": 0.4277069771706244, + "learning_rate": 0.00011446043825066472, + "loss": 0.8894, + "mean_token_accuracy": 0.7344420850276947, + "num_tokens": 107804722.0, + "step": 46650 + }, + { + "epoch": 0.4277986614101036, + "learning_rate": 0.00011444210140276887, + "loss": 0.8396, + "mean_token_accuracy": 0.745812463760376, + "num_tokens": 107827444.0, + "step": 46660 + }, + { + "epoch": 0.42789034564958284, + "learning_rate": 0.00011442376455487302, + "loss": 0.8393, + "mean_token_accuracy": 0.7476184010505676, + "num_tokens": 107850960.0, + "step": 46670 + }, + { + "epoch": 0.4279820298890621, + "learning_rate": 0.00011440542770697718, + "loss": 0.8065, + "mean_token_accuracy": 0.7576253831386566, + "num_tokens": 107874184.0, + "step": 46680 + }, + { + "epoch": 0.4280737141285413, + "learning_rate": 0.00011438709085908133, + "loss": 0.8677, + "mean_token_accuracy": 0.7421083569526672, + "num_tokens": 107897879.0, + "step": 46690 + }, + { + "epoch": 0.42816539836802053, + "learning_rate": 0.00011436875401118548, + "loss": 0.8013, + "mean_token_accuracy": 0.756723302602768, + "num_tokens": 107920538.0, + "step": 46700 + }, + { + "epoch": 0.4282570826074998, + "learning_rate": 0.00011435041716328964, + "loss": 0.8377, + "mean_token_accuracy": 0.7451123595237732, + "num_tokens": 107943645.0, + "step": 46710 + }, + { + "epoch": 0.428348766846979, + "learning_rate": 0.0001143320803153938, + "loss": 0.8404, + "mean_token_accuracy": 0.7516084432601928, + "num_tokens": 107966827.0, + "step": 46720 + }, + { + "epoch": 0.42844045108645823, + "learning_rate": 0.00011431374346749795, + "loss": 0.8058, + "mean_token_accuracy": 0.7576744019985199, + "num_tokens": 107990085.0, + "step": 46730 + }, + { + "epoch": 0.4285321353259375, + "learning_rate": 0.0001142954066196021, + "loss": 0.8468, + "mean_token_accuracy": 0.7461348176002502, + "num_tokens": 108013237.0, + "step": 46740 + }, + { + "epoch": 0.42862381956541673, + "learning_rate": 0.00011427706977170625, + "loss": 0.8565, + "mean_token_accuracy": 0.7457659125328064, + "num_tokens": 108035642.0, + "step": 46750 + }, + { + "epoch": 0.4287155038048959, + "learning_rate": 0.00011425873292381039, + "loss": 0.8009, + "mean_token_accuracy": 0.7604243099689484, + "num_tokens": 108058652.0, + "step": 46760 + }, + { + "epoch": 0.4288071880443752, + "learning_rate": 0.00011424039607591454, + "loss": 0.8551, + "mean_token_accuracy": 0.7479537963867188, + "num_tokens": 108082719.0, + "step": 46770 + }, + { + "epoch": 0.4288988722838544, + "learning_rate": 0.00011422205922801872, + "loss": 0.8723, + "mean_token_accuracy": 0.7449828326702118, + "num_tokens": 108105907.0, + "step": 46780 + }, + { + "epoch": 0.4289905565233336, + "learning_rate": 0.00011420372238012287, + "loss": 0.8405, + "mean_token_accuracy": 0.747146052122116, + "num_tokens": 108128613.0, + "step": 46790 + }, + { + "epoch": 0.42908224076281287, + "learning_rate": 0.00011418538553222701, + "loss": 0.8723, + "mean_token_accuracy": 0.7421761274337768, + "num_tokens": 108151929.0, + "step": 46800 + }, + { + "epoch": 0.4291739250022921, + "learning_rate": 0.00011416704868433116, + "loss": 0.8338, + "mean_token_accuracy": 0.7516462743282318, + "num_tokens": 108174638.0, + "step": 46810 + }, + { + "epoch": 0.4292656092417713, + "learning_rate": 0.00011414871183643532, + "loss": 0.8717, + "mean_token_accuracy": 0.7379578471183776, + "num_tokens": 108198260.0, + "step": 46820 + }, + { + "epoch": 0.42935729348125057, + "learning_rate": 0.00011413037498853947, + "loss": 0.8593, + "mean_token_accuracy": 0.745039564371109, + "num_tokens": 108221876.0, + "step": 46830 + }, + { + "epoch": 0.4294489777207298, + "learning_rate": 0.00011411203814064362, + "loss": 0.8577, + "mean_token_accuracy": 0.7417080342769623, + "num_tokens": 108245244.0, + "step": 46840 + }, + { + "epoch": 0.429540661960209, + "learning_rate": 0.00011409370129274778, + "loss": 0.829, + "mean_token_accuracy": 0.7539389371871948, + "num_tokens": 108268712.0, + "step": 46850 + }, + { + "epoch": 0.42963234619968826, + "learning_rate": 0.00011407536444485194, + "loss": 0.8444, + "mean_token_accuracy": 0.7451859951019287, + "num_tokens": 108291201.0, + "step": 46860 + }, + { + "epoch": 0.4297240304391675, + "learning_rate": 0.00011405702759695609, + "loss": 0.8364, + "mean_token_accuracy": 0.7501066982746124, + "num_tokens": 108313510.0, + "step": 46870 + }, + { + "epoch": 0.42981571467864677, + "learning_rate": 0.00011403869074906024, + "loss": 0.8919, + "mean_token_accuracy": 0.736325454711914, + "num_tokens": 108336439.0, + "step": 46880 + }, + { + "epoch": 0.42990739891812596, + "learning_rate": 0.00011402035390116439, + "loss": 0.8355, + "mean_token_accuracy": 0.7490274965763092, + "num_tokens": 108359350.0, + "step": 46890 + }, + { + "epoch": 0.4299990831576052, + "learning_rate": 0.00011400201705326854, + "loss": 0.8167, + "mean_token_accuracy": 0.747568941116333, + "num_tokens": 108382543.0, + "step": 46900 + }, + { + "epoch": 0.43009076739708446, + "learning_rate": 0.00011398368020537271, + "loss": 0.8634, + "mean_token_accuracy": 0.7424772560596467, + "num_tokens": 108406241.0, + "step": 46910 + }, + { + "epoch": 0.43018245163656366, + "learning_rate": 0.00011396534335747686, + "loss": 0.8325, + "mean_token_accuracy": 0.7476962924003601, + "num_tokens": 108429123.0, + "step": 46920 + }, + { + "epoch": 0.4302741358760429, + "learning_rate": 0.00011394700650958101, + "loss": 0.8509, + "mean_token_accuracy": 0.7468082726001739, + "num_tokens": 108452949.0, + "step": 46930 + }, + { + "epoch": 0.43036582011552216, + "learning_rate": 0.00011392866966168516, + "loss": 0.8464, + "mean_token_accuracy": 0.7468827307224274, + "num_tokens": 108475489.0, + "step": 46940 + }, + { + "epoch": 0.43045750435500135, + "learning_rate": 0.00011391033281378932, + "loss": 0.844, + "mean_token_accuracy": 0.7473788142204285, + "num_tokens": 108498587.0, + "step": 46950 + }, + { + "epoch": 0.4305491885944806, + "learning_rate": 0.00011389199596589345, + "loss": 0.8111, + "mean_token_accuracy": 0.7529711425304413, + "num_tokens": 108522167.0, + "step": 46960 + }, + { + "epoch": 0.43064087283395985, + "learning_rate": 0.00011387365911799761, + "loss": 0.8235, + "mean_token_accuracy": 0.7489188611507416, + "num_tokens": 108545631.0, + "step": 46970 + }, + { + "epoch": 0.43073255707343905, + "learning_rate": 0.00011385532227010179, + "loss": 0.8478, + "mean_token_accuracy": 0.7511611342430115, + "num_tokens": 108568542.0, + "step": 46980 + }, + { + "epoch": 0.4308242413129183, + "learning_rate": 0.00011383698542220594, + "loss": 0.8559, + "mean_token_accuracy": 0.7441620111465455, + "num_tokens": 108591717.0, + "step": 46990 + }, + { + "epoch": 0.43091592555239755, + "learning_rate": 0.00011381864857431009, + "loss": 0.8292, + "mean_token_accuracy": 0.745752078294754, + "num_tokens": 108615225.0, + "step": 47000 + }, + { + "epoch": 0.4310076097918768, + "learning_rate": 0.00011380031172641423, + "loss": 0.8852, + "mean_token_accuracy": 0.7369329392910003, + "num_tokens": 108637645.0, + "step": 47010 + }, + { + "epoch": 0.431099294031356, + "learning_rate": 0.00011378197487851838, + "loss": 0.8178, + "mean_token_accuracy": 0.7573180019855499, + "num_tokens": 108661040.0, + "step": 47020 + }, + { + "epoch": 0.43119097827083525, + "learning_rate": 0.00011376363803062253, + "loss": 0.8595, + "mean_token_accuracy": 0.7456544458866119, + "num_tokens": 108684243.0, + "step": 47030 + }, + { + "epoch": 0.4312826625103145, + "learning_rate": 0.00011374530118272671, + "loss": 0.8712, + "mean_token_accuracy": 0.7465338408946991, + "num_tokens": 108707164.0, + "step": 47040 + }, + { + "epoch": 0.4313743467497937, + "learning_rate": 0.00011372696433483085, + "loss": 0.8297, + "mean_token_accuracy": 0.7447070181369781, + "num_tokens": 108729998.0, + "step": 47050 + }, + { + "epoch": 0.43146603098927294, + "learning_rate": 0.000113708627486935, + "loss": 0.8165, + "mean_token_accuracy": 0.7562990963459015, + "num_tokens": 108753120.0, + "step": 47060 + }, + { + "epoch": 0.4315577152287522, + "learning_rate": 0.00011369029063903915, + "loss": 0.8185, + "mean_token_accuracy": 0.7538254737854004, + "num_tokens": 108776661.0, + "step": 47070 + }, + { + "epoch": 0.4316493994682314, + "learning_rate": 0.0001136719537911433, + "loss": 0.8541, + "mean_token_accuracy": 0.7439543306827545, + "num_tokens": 108799474.0, + "step": 47080 + }, + { + "epoch": 0.43174108370771064, + "learning_rate": 0.00011365361694324746, + "loss": 0.8215, + "mean_token_accuracy": 0.7555378258228302, + "num_tokens": 108822375.0, + "step": 47090 + }, + { + "epoch": 0.4318327679471899, + "learning_rate": 0.00011363528009535161, + "loss": 0.8082, + "mean_token_accuracy": 0.749610298871994, + "num_tokens": 108845344.0, + "step": 47100 + }, + { + "epoch": 0.43192445218666914, + "learning_rate": 0.00011361694324745577, + "loss": 0.8228, + "mean_token_accuracy": 0.7503890573978425, + "num_tokens": 108868464.0, + "step": 47110 + }, + { + "epoch": 0.43201613642614833, + "learning_rate": 0.00011359860639955993, + "loss": 0.8153, + "mean_token_accuracy": 0.7527883887290955, + "num_tokens": 108892714.0, + "step": 47120 + }, + { + "epoch": 0.4321078206656276, + "learning_rate": 0.00011358026955166408, + "loss": 0.8289, + "mean_token_accuracy": 0.7499531209468842, + "num_tokens": 108915592.0, + "step": 47130 + }, + { + "epoch": 0.43219950490510683, + "learning_rate": 0.00011356193270376823, + "loss": 0.855, + "mean_token_accuracy": 0.744117820262909, + "num_tokens": 108939067.0, + "step": 47140 + }, + { + "epoch": 0.43229118914458603, + "learning_rate": 0.00011354359585587238, + "loss": 0.8515, + "mean_token_accuracy": 0.7455109179019928, + "num_tokens": 108962684.0, + "step": 47150 + }, + { + "epoch": 0.4323828733840653, + "learning_rate": 0.00011352525900797652, + "loss": 0.809, + "mean_token_accuracy": 0.7546250522136688, + "num_tokens": 108985648.0, + "step": 47160 + }, + { + "epoch": 0.43247455762354453, + "learning_rate": 0.0001135069221600807, + "loss": 0.8522, + "mean_token_accuracy": 0.7464926838874817, + "num_tokens": 109009257.0, + "step": 47170 + }, + { + "epoch": 0.4325662418630237, + "learning_rate": 0.00011348858531218485, + "loss": 0.8255, + "mean_token_accuracy": 0.7509628474712372, + "num_tokens": 109032839.0, + "step": 47180 + }, + { + "epoch": 0.432657926102503, + "learning_rate": 0.000113470248464289, + "loss": 0.8287, + "mean_token_accuracy": 0.7467759847640991, + "num_tokens": 109056222.0, + "step": 47190 + }, + { + "epoch": 0.4327496103419822, + "learning_rate": 0.00011345191161639315, + "loss": 0.8233, + "mean_token_accuracy": 0.7523932933807373, + "num_tokens": 109079559.0, + "step": 47200 + }, + { + "epoch": 0.4328412945814614, + "learning_rate": 0.00011343357476849729, + "loss": 0.8488, + "mean_token_accuracy": 0.751216036081314, + "num_tokens": 109103218.0, + "step": 47210 + }, + { + "epoch": 0.4329329788209407, + "learning_rate": 0.00011341523792060144, + "loss": 0.8852, + "mean_token_accuracy": 0.7350303649902343, + "num_tokens": 109126005.0, + "step": 47220 + }, + { + "epoch": 0.4330246630604199, + "learning_rate": 0.0001133969010727056, + "loss": 0.8303, + "mean_token_accuracy": 0.7465072870254517, + "num_tokens": 109148997.0, + "step": 47230 + }, + { + "epoch": 0.4331163472998992, + "learning_rate": 0.00011337856422480978, + "loss": 0.8438, + "mean_token_accuracy": 0.7420282483100891, + "num_tokens": 109172288.0, + "step": 47240 + }, + { + "epoch": 0.43320803153937837, + "learning_rate": 0.00011336022737691391, + "loss": 0.8146, + "mean_token_accuracy": 0.7545742690563202, + "num_tokens": 109196546.0, + "step": 47250 + }, + { + "epoch": 0.4332997157788576, + "learning_rate": 0.00011334189052901807, + "loss": 0.8921, + "mean_token_accuracy": 0.7386726856231689, + "num_tokens": 109219914.0, + "step": 47260 + }, + { + "epoch": 0.43339140001833687, + "learning_rate": 0.00011332355368112222, + "loss": 0.8304, + "mean_token_accuracy": 0.7491811335086822, + "num_tokens": 109243472.0, + "step": 47270 + }, + { + "epoch": 0.43348308425781606, + "learning_rate": 0.00011330521683322637, + "loss": 0.861, + "mean_token_accuracy": 0.7429771661758423, + "num_tokens": 109266778.0, + "step": 47280 + }, + { + "epoch": 0.4335747684972953, + "learning_rate": 0.00011328687998533052, + "loss": 0.8425, + "mean_token_accuracy": 0.7458553075790405, + "num_tokens": 109290212.0, + "step": 47290 + }, + { + "epoch": 0.43366645273677457, + "learning_rate": 0.00011326854313743469, + "loss": 0.867, + "mean_token_accuracy": 0.7425900459289551, + "num_tokens": 109313187.0, + "step": 47300 + }, + { + "epoch": 0.43375813697625376, + "learning_rate": 0.00011325020628953884, + "loss": 0.8091, + "mean_token_accuracy": 0.756443053483963, + "num_tokens": 109336723.0, + "step": 47310 + }, + { + "epoch": 0.433849821215733, + "learning_rate": 0.00011323186944164299, + "loss": 0.8696, + "mean_token_accuracy": 0.7415278375148773, + "num_tokens": 109360238.0, + "step": 47320 + }, + { + "epoch": 0.43394150545521226, + "learning_rate": 0.00011321353259374714, + "loss": 0.8426, + "mean_token_accuracy": 0.7460782110691071, + "num_tokens": 109383338.0, + "step": 47330 + }, + { + "epoch": 0.43403318969469146, + "learning_rate": 0.0001131951957458513, + "loss": 0.8582, + "mean_token_accuracy": 0.7424134850502014, + "num_tokens": 109406490.0, + "step": 47340 + }, + { + "epoch": 0.4341248739341707, + "learning_rate": 0.00011317685889795545, + "loss": 0.8301, + "mean_token_accuracy": 0.7553377032279969, + "num_tokens": 109429540.0, + "step": 47350 + }, + { + "epoch": 0.43421655817364996, + "learning_rate": 0.00011315852205005958, + "loss": 0.8116, + "mean_token_accuracy": 0.7546046912670136, + "num_tokens": 109452428.0, + "step": 47360 + }, + { + "epoch": 0.4343082424131292, + "learning_rate": 0.00011314018520216376, + "loss": 0.8363, + "mean_token_accuracy": 0.7467213153839112, + "num_tokens": 109475244.0, + "step": 47370 + }, + { + "epoch": 0.4343999266526084, + "learning_rate": 0.00011312184835426791, + "loss": 0.8499, + "mean_token_accuracy": 0.7427000403404236, + "num_tokens": 109498832.0, + "step": 47380 + }, + { + "epoch": 0.43449161089208765, + "learning_rate": 0.00011310351150637207, + "loss": 0.833, + "mean_token_accuracy": 0.7458879351615906, + "num_tokens": 109521803.0, + "step": 47390 + }, + { + "epoch": 0.4345832951315669, + "learning_rate": 0.00011308517465847622, + "loss": 0.8439, + "mean_token_accuracy": 0.7500184535980224, + "num_tokens": 109544973.0, + "step": 47400 + }, + { + "epoch": 0.4346749793710461, + "learning_rate": 0.00011306683781058036, + "loss": 0.8311, + "mean_token_accuracy": 0.7486188590526581, + "num_tokens": 109567935.0, + "step": 47410 + }, + { + "epoch": 0.43476666361052535, + "learning_rate": 0.00011304850096268451, + "loss": 0.8035, + "mean_token_accuracy": 0.7516610980033874, + "num_tokens": 109591707.0, + "step": 47420 + }, + { + "epoch": 0.4348583478500046, + "learning_rate": 0.00011303016411478869, + "loss": 0.8036, + "mean_token_accuracy": 0.7554397463798523, + "num_tokens": 109614822.0, + "step": 47430 + }, + { + "epoch": 0.4349500320894838, + "learning_rate": 0.00011301182726689284, + "loss": 0.8728, + "mean_token_accuracy": 0.7391930520534515, + "num_tokens": 109637931.0, + "step": 47440 + }, + { + "epoch": 0.43504171632896305, + "learning_rate": 0.00011299349041899698, + "loss": 0.8772, + "mean_token_accuracy": 0.7359247624874115, + "num_tokens": 109661019.0, + "step": 47450 + }, + { + "epoch": 0.4351334005684423, + "learning_rate": 0.00011297515357110113, + "loss": 0.8285, + "mean_token_accuracy": 0.7506414473056793, + "num_tokens": 109683416.0, + "step": 47460 + }, + { + "epoch": 0.4352250848079215, + "learning_rate": 0.00011295681672320528, + "loss": 0.8491, + "mean_token_accuracy": 0.7429089784622193, + "num_tokens": 109706303.0, + "step": 47470 + }, + { + "epoch": 0.43531676904740074, + "learning_rate": 0.00011293847987530943, + "loss": 0.8288, + "mean_token_accuracy": 0.7507230579853058, + "num_tokens": 109729845.0, + "step": 47480 + }, + { + "epoch": 0.43540845328688, + "learning_rate": 0.00011292014302741359, + "loss": 0.8876, + "mean_token_accuracy": 0.7348084867000579, + "num_tokens": 109753109.0, + "step": 47490 + }, + { + "epoch": 0.43550013752635924, + "learning_rate": 0.00011290180617951775, + "loss": 0.8278, + "mean_token_accuracy": 0.7435014486312866, + "num_tokens": 109775944.0, + "step": 47500 + }, + { + "epoch": 0.43559182176583844, + "learning_rate": 0.0001128834693316219, + "loss": 0.8863, + "mean_token_accuracy": 0.7433479726314545, + "num_tokens": 109799022.0, + "step": 47510 + }, + { + "epoch": 0.4356835060053177, + "learning_rate": 0.00011286513248372605, + "loss": 0.8715, + "mean_token_accuracy": 0.7416722118854523, + "num_tokens": 109822320.0, + "step": 47520 + }, + { + "epoch": 0.43577519024479694, + "learning_rate": 0.0001128467956358302, + "loss": 0.8673, + "mean_token_accuracy": 0.7449494242668152, + "num_tokens": 109845031.0, + "step": 47530 + }, + { + "epoch": 0.43586687448427613, + "learning_rate": 0.00011282845878793436, + "loss": 0.835, + "mean_token_accuracy": 0.7494809627532959, + "num_tokens": 109869083.0, + "step": 47540 + }, + { + "epoch": 0.4359585587237554, + "learning_rate": 0.00011281012194003851, + "loss": 0.8847, + "mean_token_accuracy": 0.7433875679969788, + "num_tokens": 109892372.0, + "step": 47550 + }, + { + "epoch": 0.43605024296323464, + "learning_rate": 0.00011279178509214268, + "loss": 0.8527, + "mean_token_accuracy": 0.7452048778533935, + "num_tokens": 109914468.0, + "step": 47560 + }, + { + "epoch": 0.43614192720271383, + "learning_rate": 0.00011277344824424683, + "loss": 0.8421, + "mean_token_accuracy": 0.7487707376480103, + "num_tokens": 109937209.0, + "step": 47570 + }, + { + "epoch": 0.4362336114421931, + "learning_rate": 0.00011275511139635098, + "loss": 0.8534, + "mean_token_accuracy": 0.7431705534458161, + "num_tokens": 109960483.0, + "step": 47580 + }, + { + "epoch": 0.43632529568167233, + "learning_rate": 0.00011273677454845513, + "loss": 0.8795, + "mean_token_accuracy": 0.7445425689220428, + "num_tokens": 109984301.0, + "step": 47590 + }, + { + "epoch": 0.4364169799211515, + "learning_rate": 0.00011271843770055928, + "loss": 0.8598, + "mean_token_accuracy": 0.7453936636447906, + "num_tokens": 110007046.0, + "step": 47600 + }, + { + "epoch": 0.4365086641606308, + "learning_rate": 0.00011270010085266342, + "loss": 0.8745, + "mean_token_accuracy": 0.7403316795825958, + "num_tokens": 110030704.0, + "step": 47610 + }, + { + "epoch": 0.43660034840011, + "learning_rate": 0.00011268176400476757, + "loss": 0.8027, + "mean_token_accuracy": 0.7546936690807342, + "num_tokens": 110053814.0, + "step": 47620 + }, + { + "epoch": 0.4366920326395893, + "learning_rate": 0.00011266342715687175, + "loss": 0.84, + "mean_token_accuracy": 0.7457985043525696, + "num_tokens": 110076518.0, + "step": 47630 + }, + { + "epoch": 0.4367837168790685, + "learning_rate": 0.0001126450903089759, + "loss": 0.8349, + "mean_token_accuracy": 0.7517504334449768, + "num_tokens": 110099414.0, + "step": 47640 + }, + { + "epoch": 0.4368754011185477, + "learning_rate": 0.00011262675346108004, + "loss": 0.8605, + "mean_token_accuracy": 0.7411771178245544, + "num_tokens": 110122327.0, + "step": 47650 + }, + { + "epoch": 0.436967085358027, + "learning_rate": 0.0001126084166131842, + "loss": 0.8344, + "mean_token_accuracy": 0.7514030754566192, + "num_tokens": 110144843.0, + "step": 47660 + }, + { + "epoch": 0.43705876959750617, + "learning_rate": 0.00011259007976528835, + "loss": 0.7993, + "mean_token_accuracy": 0.7621033012866973, + "num_tokens": 110167395.0, + "step": 47670 + }, + { + "epoch": 0.4371504538369854, + "learning_rate": 0.0001125717429173925, + "loss": 0.8609, + "mean_token_accuracy": 0.743192583322525, + "num_tokens": 110190771.0, + "step": 47680 + }, + { + "epoch": 0.43724213807646467, + "learning_rate": 0.00011255340606949666, + "loss": 0.8391, + "mean_token_accuracy": 0.7415359079837799, + "num_tokens": 110213809.0, + "step": 47690 + }, + { + "epoch": 0.43733382231594387, + "learning_rate": 0.00011253506922160082, + "loss": 0.8687, + "mean_token_accuracy": 0.7418878674507141, + "num_tokens": 110237147.0, + "step": 47700 + }, + { + "epoch": 0.4374255065554231, + "learning_rate": 0.00011251673237370497, + "loss": 0.8464, + "mean_token_accuracy": 0.744903302192688, + "num_tokens": 110260620.0, + "step": 47710 + }, + { + "epoch": 0.43751719079490237, + "learning_rate": 0.00011249839552580912, + "loss": 0.8511, + "mean_token_accuracy": 0.7429839372634888, + "num_tokens": 110283629.0, + "step": 47720 + }, + { + "epoch": 0.4376088750343816, + "learning_rate": 0.00011248005867791327, + "loss": 0.8204, + "mean_token_accuracy": 0.7538785874843598, + "num_tokens": 110307301.0, + "step": 47730 + }, + { + "epoch": 0.4377005592738608, + "learning_rate": 0.00011246172183001742, + "loss": 0.8326, + "mean_token_accuracy": 0.7453486859798432, + "num_tokens": 110331156.0, + "step": 47740 + }, + { + "epoch": 0.43779224351334006, + "learning_rate": 0.00011244338498212157, + "loss": 0.8229, + "mean_token_accuracy": 0.7505684137344361, + "num_tokens": 110353859.0, + "step": 47750 + }, + { + "epoch": 0.4378839277528193, + "learning_rate": 0.00011242504813422574, + "loss": 0.8459, + "mean_token_accuracy": 0.7491546094417572, + "num_tokens": 110376640.0, + "step": 47760 + }, + { + "epoch": 0.4379756119922985, + "learning_rate": 0.00011240671128632989, + "loss": 0.8719, + "mean_token_accuracy": 0.737398773431778, + "num_tokens": 110398873.0, + "step": 47770 + }, + { + "epoch": 0.43806729623177776, + "learning_rate": 0.00011238837443843404, + "loss": 0.8639, + "mean_token_accuracy": 0.7408490121364594, + "num_tokens": 110421782.0, + "step": 47780 + }, + { + "epoch": 0.438158980471257, + "learning_rate": 0.0001123700375905382, + "loss": 0.8472, + "mean_token_accuracy": 0.7413858413696289, + "num_tokens": 110444264.0, + "step": 47790 + }, + { + "epoch": 0.4382506647107362, + "learning_rate": 0.00011235170074264235, + "loss": 0.8096, + "mean_token_accuracy": 0.7543434023857116, + "num_tokens": 110468139.0, + "step": 47800 + }, + { + "epoch": 0.43834234895021545, + "learning_rate": 0.00011233336389474649, + "loss": 0.8252, + "mean_token_accuracy": 0.7495468199253082, + "num_tokens": 110491294.0, + "step": 47810 + }, + { + "epoch": 0.4384340331896947, + "learning_rate": 0.00011231502704685066, + "loss": 0.8393, + "mean_token_accuracy": 0.7498344779014587, + "num_tokens": 110514341.0, + "step": 47820 + }, + { + "epoch": 0.4385257174291739, + "learning_rate": 0.00011229669019895482, + "loss": 0.8297, + "mean_token_accuracy": 0.7459732294082642, + "num_tokens": 110536919.0, + "step": 47830 + }, + { + "epoch": 0.43861740166865315, + "learning_rate": 0.00011227835335105897, + "loss": 0.8193, + "mean_token_accuracy": 0.7531251728534698, + "num_tokens": 110559772.0, + "step": 47840 + }, + { + "epoch": 0.4387090859081324, + "learning_rate": 0.0001122600165031631, + "loss": 0.8598, + "mean_token_accuracy": 0.74596666097641, + "num_tokens": 110583155.0, + "step": 47850 + }, + { + "epoch": 0.43880077014761165, + "learning_rate": 0.00011224167965526726, + "loss": 0.8042, + "mean_token_accuracy": 0.7572456061840057, + "num_tokens": 110606133.0, + "step": 47860 + }, + { + "epoch": 0.43889245438709085, + "learning_rate": 0.00011222334280737141, + "loss": 0.86, + "mean_token_accuracy": 0.7468728244304657, + "num_tokens": 110629386.0, + "step": 47870 + }, + { + "epoch": 0.4389841386265701, + "learning_rate": 0.00011220500595947556, + "loss": 0.8094, + "mean_token_accuracy": 0.7484618306159974, + "num_tokens": 110652706.0, + "step": 47880 + }, + { + "epoch": 0.43907582286604935, + "learning_rate": 0.00011218666911157973, + "loss": 0.8663, + "mean_token_accuracy": 0.7431293547153472, + "num_tokens": 110676470.0, + "step": 47890 + }, + { + "epoch": 0.43916750710552854, + "learning_rate": 0.00011216833226368388, + "loss": 0.8639, + "mean_token_accuracy": 0.7359496176242828, + "num_tokens": 110698917.0, + "step": 47900 + }, + { + "epoch": 0.4392591913450078, + "learning_rate": 0.00011214999541578803, + "loss": 0.8782, + "mean_token_accuracy": 0.7332504093647003, + "num_tokens": 110722163.0, + "step": 47910 + }, + { + "epoch": 0.43935087558448704, + "learning_rate": 0.00011213165856789218, + "loss": 0.842, + "mean_token_accuracy": 0.7502342283725738, + "num_tokens": 110744412.0, + "step": 47920 + }, + { + "epoch": 0.43944255982396624, + "learning_rate": 0.00011211332171999634, + "loss": 0.8358, + "mean_token_accuracy": 0.7493318498134613, + "num_tokens": 110767155.0, + "step": 47930 + }, + { + "epoch": 0.4395342440634455, + "learning_rate": 0.00011209498487210049, + "loss": 0.8393, + "mean_token_accuracy": 0.7504944324493408, + "num_tokens": 110790698.0, + "step": 47940 + }, + { + "epoch": 0.43962592830292474, + "learning_rate": 0.00011207664802420464, + "loss": 0.8611, + "mean_token_accuracy": 0.74017373919487, + "num_tokens": 110813105.0, + "step": 47950 + }, + { + "epoch": 0.43971761254240394, + "learning_rate": 0.0001120583111763088, + "loss": 0.8906, + "mean_token_accuracy": 0.7391743063926697, + "num_tokens": 110836414.0, + "step": 47960 + }, + { + "epoch": 0.4398092967818832, + "learning_rate": 0.00011203997432841296, + "loss": 0.849, + "mean_token_accuracy": 0.7519432365894317, + "num_tokens": 110859412.0, + "step": 47970 + }, + { + "epoch": 0.43990098102136244, + "learning_rate": 0.00011202163748051711, + "loss": 0.8219, + "mean_token_accuracy": 0.7501432836055756, + "num_tokens": 110882565.0, + "step": 47980 + }, + { + "epoch": 0.4399926652608417, + "learning_rate": 0.00011200330063262126, + "loss": 0.8565, + "mean_token_accuracy": 0.7413366377353668, + "num_tokens": 110905873.0, + "step": 47990 + }, + { + "epoch": 0.4400843495003209, + "learning_rate": 0.00011198496378472541, + "loss": 0.8668, + "mean_token_accuracy": 0.7434598743915558, + "num_tokens": 110928593.0, + "step": 48000 + }, + { + "epoch": 0.44017603373980013, + "learning_rate": 0.00011196662693682955, + "loss": 0.8569, + "mean_token_accuracy": 0.7399765908718109, + "num_tokens": 110951927.0, + "step": 48010 + }, + { + "epoch": 0.4402677179792794, + "learning_rate": 0.00011194829008893373, + "loss": 0.8959, + "mean_token_accuracy": 0.7379552721977234, + "num_tokens": 110974728.0, + "step": 48020 + }, + { + "epoch": 0.4403594022187586, + "learning_rate": 0.00011192995324103788, + "loss": 0.8563, + "mean_token_accuracy": 0.7470605075359344, + "num_tokens": 110997767.0, + "step": 48030 + }, + { + "epoch": 0.44045108645823783, + "learning_rate": 0.00011191161639314203, + "loss": 0.867, + "mean_token_accuracy": 0.7417555212974548, + "num_tokens": 111020601.0, + "step": 48040 + }, + { + "epoch": 0.4405427706977171, + "learning_rate": 0.00011189327954524617, + "loss": 0.8309, + "mean_token_accuracy": 0.7526868402957916, + "num_tokens": 111044160.0, + "step": 48050 + }, + { + "epoch": 0.4406344549371963, + "learning_rate": 0.00011187494269735032, + "loss": 0.8659, + "mean_token_accuracy": 0.7407997131347657, + "num_tokens": 111066463.0, + "step": 48060 + }, + { + "epoch": 0.4407261391766755, + "learning_rate": 0.00011185660584945447, + "loss": 0.8841, + "mean_token_accuracy": 0.7373033761978149, + "num_tokens": 111089205.0, + "step": 48070 + }, + { + "epoch": 0.4408178234161548, + "learning_rate": 0.00011183826900155863, + "loss": 0.8618, + "mean_token_accuracy": 0.7385069906711579, + "num_tokens": 111113153.0, + "step": 48080 + }, + { + "epoch": 0.44090950765563397, + "learning_rate": 0.00011181993215366279, + "loss": 0.8454, + "mean_token_accuracy": 0.7498517215251923, + "num_tokens": 111136309.0, + "step": 48090 + }, + { + "epoch": 0.4410011918951132, + "learning_rate": 0.00011180159530576694, + "loss": 0.8045, + "mean_token_accuracy": 0.752761310338974, + "num_tokens": 111159628.0, + "step": 48100 + }, + { + "epoch": 0.44109287613459247, + "learning_rate": 0.0001117832584578711, + "loss": 0.8274, + "mean_token_accuracy": 0.7500851690769196, + "num_tokens": 111181301.0, + "step": 48110 + }, + { + "epoch": 0.4411845603740717, + "learning_rate": 0.00011176492160997525, + "loss": 0.8878, + "mean_token_accuracy": 0.73563272356987, + "num_tokens": 111205095.0, + "step": 48120 + }, + { + "epoch": 0.4412762446135509, + "learning_rate": 0.0001117465847620794, + "loss": 0.8276, + "mean_token_accuracy": 0.7553383767604828, + "num_tokens": 111229087.0, + "step": 48130 + }, + { + "epoch": 0.44136792885303017, + "learning_rate": 0.00011172824791418355, + "loss": 0.8027, + "mean_token_accuracy": 0.7565086603164672, + "num_tokens": 111252412.0, + "step": 48140 + }, + { + "epoch": 0.4414596130925094, + "learning_rate": 0.00011170991106628772, + "loss": 0.8535, + "mean_token_accuracy": 0.7428046345710755, + "num_tokens": 111276166.0, + "step": 48150 + }, + { + "epoch": 0.4415512973319886, + "learning_rate": 0.00011169157421839187, + "loss": 0.8743, + "mean_token_accuracy": 0.7416279554367066, + "num_tokens": 111299985.0, + "step": 48160 + }, + { + "epoch": 0.44164298157146786, + "learning_rate": 0.00011167323737049602, + "loss": 0.8538, + "mean_token_accuracy": 0.7420009493827819, + "num_tokens": 111322962.0, + "step": 48170 + }, + { + "epoch": 0.4417346658109471, + "learning_rate": 0.00011165490052260017, + "loss": 0.8049, + "mean_token_accuracy": 0.7578908443450928, + "num_tokens": 111346803.0, + "step": 48180 + }, + { + "epoch": 0.4418263500504263, + "learning_rate": 0.00011163656367470432, + "loss": 0.8412, + "mean_token_accuracy": 0.7449650347232819, + "num_tokens": 111370770.0, + "step": 48190 + }, + { + "epoch": 0.44191803428990556, + "learning_rate": 0.00011161822682680848, + "loss": 0.8753, + "mean_token_accuracy": 0.7434915244579315, + "num_tokens": 111393568.0, + "step": 48200 + }, + { + "epoch": 0.4420097185293848, + "learning_rate": 0.00011159988997891261, + "loss": 0.8212, + "mean_token_accuracy": 0.7529119253158569, + "num_tokens": 111415946.0, + "step": 48210 + }, + { + "epoch": 0.442101402768864, + "learning_rate": 0.0001115815531310168, + "loss": 0.8207, + "mean_token_accuracy": 0.7478813529014587, + "num_tokens": 111439298.0, + "step": 48220 + }, + { + "epoch": 0.44219308700834326, + "learning_rate": 0.00011156321628312095, + "loss": 0.8414, + "mean_token_accuracy": 0.7486931622028351, + "num_tokens": 111461606.0, + "step": 48230 + }, + { + "epoch": 0.4422847712478225, + "learning_rate": 0.0001115448794352251, + "loss": 0.8721, + "mean_token_accuracy": 0.734430581331253, + "num_tokens": 111485670.0, + "step": 48240 + }, + { + "epoch": 0.44237645548730176, + "learning_rate": 0.00011152654258732924, + "loss": 0.803, + "mean_token_accuracy": 0.752145254611969, + "num_tokens": 111508206.0, + "step": 48250 + }, + { + "epoch": 0.44246813972678095, + "learning_rate": 0.00011150820573943339, + "loss": 0.8162, + "mean_token_accuracy": 0.7478123664855957, + "num_tokens": 111531283.0, + "step": 48260 + }, + { + "epoch": 0.4425598239662602, + "learning_rate": 0.00011148986889153754, + "loss": 0.8832, + "mean_token_accuracy": 0.732526296377182, + "num_tokens": 111554499.0, + "step": 48270 + }, + { + "epoch": 0.44265150820573945, + "learning_rate": 0.00011147153204364172, + "loss": 0.8333, + "mean_token_accuracy": 0.7498092830181122, + "num_tokens": 111577813.0, + "step": 48280 + }, + { + "epoch": 0.44274319244521865, + "learning_rate": 0.00011145319519574586, + "loss": 0.8205, + "mean_token_accuracy": 0.7563820898532867, + "num_tokens": 111600687.0, + "step": 48290 + }, + { + "epoch": 0.4428348766846979, + "learning_rate": 0.00011143485834785001, + "loss": 0.8373, + "mean_token_accuracy": 0.7509080648422242, + "num_tokens": 111624675.0, + "step": 48300 + }, + { + "epoch": 0.44292656092417715, + "learning_rate": 0.00011141652149995416, + "loss": 0.876, + "mean_token_accuracy": 0.745772922039032, + "num_tokens": 111648130.0, + "step": 48310 + }, + { + "epoch": 0.44301824516365634, + "learning_rate": 0.00011139818465205831, + "loss": 0.8116, + "mean_token_accuracy": 0.7508679330348969, + "num_tokens": 111671383.0, + "step": 48320 + }, + { + "epoch": 0.4431099294031356, + "learning_rate": 0.00011137984780416246, + "loss": 0.8242, + "mean_token_accuracy": 0.744922548532486, + "num_tokens": 111694055.0, + "step": 48330 + }, + { + "epoch": 0.44320161364261484, + "learning_rate": 0.00011136151095626662, + "loss": 0.8701, + "mean_token_accuracy": 0.739057207107544, + "num_tokens": 111716887.0, + "step": 48340 + }, + { + "epoch": 0.4432932978820941, + "learning_rate": 0.00011134317410837078, + "loss": 0.8019, + "mean_token_accuracy": 0.755261492729187, + "num_tokens": 111740165.0, + "step": 48350 + }, + { + "epoch": 0.4433849821215733, + "learning_rate": 0.00011132483726047493, + "loss": 0.8231, + "mean_token_accuracy": 0.755534029006958, + "num_tokens": 111762941.0, + "step": 48360 + }, + { + "epoch": 0.44347666636105254, + "learning_rate": 0.00011130650041257909, + "loss": 0.8429, + "mean_token_accuracy": 0.7432640075683594, + "num_tokens": 111786033.0, + "step": 48370 + }, + { + "epoch": 0.4435683506005318, + "learning_rate": 0.00011128816356468324, + "loss": 0.8586, + "mean_token_accuracy": 0.7367870032787323, + "num_tokens": 111809438.0, + "step": 48380 + }, + { + "epoch": 0.443660034840011, + "learning_rate": 0.00011126982671678739, + "loss": 0.8162, + "mean_token_accuracy": 0.7507876813411712, + "num_tokens": 111832186.0, + "step": 48390 + }, + { + "epoch": 0.44375171907949024, + "learning_rate": 0.00011125148986889154, + "loss": 0.8456, + "mean_token_accuracy": 0.7526997089385986, + "num_tokens": 111855065.0, + "step": 48400 + }, + { + "epoch": 0.4438434033189695, + "learning_rate": 0.0001112331530209957, + "loss": 0.8694, + "mean_token_accuracy": 0.7352891981601715, + "num_tokens": 111878264.0, + "step": 48410 + }, + { + "epoch": 0.4439350875584487, + "learning_rate": 0.00011121481617309986, + "loss": 0.8475, + "mean_token_accuracy": 0.7428710043430329, + "num_tokens": 111900964.0, + "step": 48420 + }, + { + "epoch": 0.44402677179792793, + "learning_rate": 0.00011119647932520401, + "loss": 0.8669, + "mean_token_accuracy": 0.7485485553741456, + "num_tokens": 111924686.0, + "step": 48430 + }, + { + "epoch": 0.4441184560374072, + "learning_rate": 0.00011117814247730816, + "loss": 0.8378, + "mean_token_accuracy": 0.7454011261463165, + "num_tokens": 111947085.0, + "step": 48440 + }, + { + "epoch": 0.4442101402768864, + "learning_rate": 0.0001111598056294123, + "loss": 0.7867, + "mean_token_accuracy": 0.762846690416336, + "num_tokens": 111969613.0, + "step": 48450 + }, + { + "epoch": 0.44430182451636563, + "learning_rate": 0.00011114146878151645, + "loss": 0.8488, + "mean_token_accuracy": 0.747734671831131, + "num_tokens": 111992591.0, + "step": 48460 + }, + { + "epoch": 0.4443935087558449, + "learning_rate": 0.0001111231319336206, + "loss": 0.8375, + "mean_token_accuracy": 0.7515955924987793, + "num_tokens": 112015781.0, + "step": 48470 + }, + { + "epoch": 0.44448519299532413, + "learning_rate": 0.00011110479508572478, + "loss": 0.8622, + "mean_token_accuracy": 0.739305853843689, + "num_tokens": 112038556.0, + "step": 48480 + }, + { + "epoch": 0.4445768772348033, + "learning_rate": 0.00011108645823782892, + "loss": 0.8199, + "mean_token_accuracy": 0.7545050203800201, + "num_tokens": 112061245.0, + "step": 48490 + }, + { + "epoch": 0.4446685614742826, + "learning_rate": 0.00011106812138993307, + "loss": 0.8519, + "mean_token_accuracy": 0.7491310596466064, + "num_tokens": 112084157.0, + "step": 48500 + }, + { + "epoch": 0.4447602457137618, + "learning_rate": 0.00011104978454203722, + "loss": 0.846, + "mean_token_accuracy": 0.743950366973877, + "num_tokens": 112106816.0, + "step": 48510 + }, + { + "epoch": 0.444851929953241, + "learning_rate": 0.00011103144769414138, + "loss": 0.8651, + "mean_token_accuracy": 0.7435440301895142, + "num_tokens": 112130547.0, + "step": 48520 + }, + { + "epoch": 0.44494361419272027, + "learning_rate": 0.00011101311084624553, + "loss": 0.8379, + "mean_token_accuracy": 0.7546590387821197, + "num_tokens": 112153080.0, + "step": 48530 + }, + { + "epoch": 0.4450352984321995, + "learning_rate": 0.0001109947739983497, + "loss": 0.8332, + "mean_token_accuracy": 0.7477194607257843, + "num_tokens": 112175546.0, + "step": 48540 + }, + { + "epoch": 0.4451269826716787, + "learning_rate": 0.00011097643715045385, + "loss": 0.8207, + "mean_token_accuracy": 0.7554192423820496, + "num_tokens": 112199320.0, + "step": 48550 + }, + { + "epoch": 0.44521866691115797, + "learning_rate": 0.000110958100302558, + "loss": 0.8245, + "mean_token_accuracy": 0.7486271440982819, + "num_tokens": 112222922.0, + "step": 48560 + }, + { + "epoch": 0.4453103511506372, + "learning_rate": 0.00011093976345466215, + "loss": 0.8, + "mean_token_accuracy": 0.7520759165287018, + "num_tokens": 112246848.0, + "step": 48570 + }, + { + "epoch": 0.4454020353901164, + "learning_rate": 0.0001109214266067663, + "loss": 0.8281, + "mean_token_accuracy": 0.7456780135631561, + "num_tokens": 112270313.0, + "step": 48580 + }, + { + "epoch": 0.44549371962959566, + "learning_rate": 0.00011090308975887045, + "loss": 0.8382, + "mean_token_accuracy": 0.7441405475139617, + "num_tokens": 112293406.0, + "step": 48590 + }, + { + "epoch": 0.4455854038690749, + "learning_rate": 0.0001108847529109746, + "loss": 0.885, + "mean_token_accuracy": 0.7378743767738343, + "num_tokens": 112316479.0, + "step": 48600 + }, + { + "epoch": 0.44567708810855416, + "learning_rate": 0.00011086641606307877, + "loss": 0.8191, + "mean_token_accuracy": 0.7532954156398773, + "num_tokens": 112339542.0, + "step": 48610 + }, + { + "epoch": 0.44576877234803336, + "learning_rate": 0.00011084807921518292, + "loss": 0.8242, + "mean_token_accuracy": 0.7503843426704406, + "num_tokens": 112362658.0, + "step": 48620 + }, + { + "epoch": 0.4458604565875126, + "learning_rate": 0.00011082974236728707, + "loss": 0.8274, + "mean_token_accuracy": 0.7489453911781311, + "num_tokens": 112385581.0, + "step": 48630 + }, + { + "epoch": 0.44595214082699186, + "learning_rate": 0.00011081140551939123, + "loss": 0.8532, + "mean_token_accuracy": 0.7436773359775544, + "num_tokens": 112408418.0, + "step": 48640 + }, + { + "epoch": 0.44604382506647106, + "learning_rate": 0.00011079306867149536, + "loss": 0.8639, + "mean_token_accuracy": 0.7423886835575104, + "num_tokens": 112431512.0, + "step": 48650 + }, + { + "epoch": 0.4461355093059503, + "learning_rate": 0.00011077473182359952, + "loss": 0.8121, + "mean_token_accuracy": 0.7494610130786896, + "num_tokens": 112454697.0, + "step": 48660 + }, + { + "epoch": 0.44622719354542956, + "learning_rate": 0.0001107563949757037, + "loss": 0.8543, + "mean_token_accuracy": 0.746228039264679, + "num_tokens": 112478021.0, + "step": 48670 + }, + { + "epoch": 0.44631887778490875, + "learning_rate": 0.00011073805812780785, + "loss": 0.8319, + "mean_token_accuracy": 0.7489956200122834, + "num_tokens": 112500980.0, + "step": 48680 + }, + { + "epoch": 0.446410562024388, + "learning_rate": 0.00011071972127991199, + "loss": 0.8488, + "mean_token_accuracy": 0.746698260307312, + "num_tokens": 112524369.0, + "step": 48690 + }, + { + "epoch": 0.44650224626386725, + "learning_rate": 0.00011070138443201614, + "loss": 0.8455, + "mean_token_accuracy": 0.7442999124526978, + "num_tokens": 112548066.0, + "step": 48700 + }, + { + "epoch": 0.44659393050334645, + "learning_rate": 0.00011068304758412029, + "loss": 0.8301, + "mean_token_accuracy": 0.7480234801769257, + "num_tokens": 112571076.0, + "step": 48710 + }, + { + "epoch": 0.4466856147428257, + "learning_rate": 0.00011066471073622444, + "loss": 0.842, + "mean_token_accuracy": 0.7521705389022827, + "num_tokens": 112594507.0, + "step": 48720 + }, + { + "epoch": 0.44677729898230495, + "learning_rate": 0.00011064637388832859, + "loss": 0.8272, + "mean_token_accuracy": 0.7517581045627594, + "num_tokens": 112618156.0, + "step": 48730 + }, + { + "epoch": 0.4468689832217842, + "learning_rate": 0.00011062803704043276, + "loss": 0.8267, + "mean_token_accuracy": 0.7492414057254791, + "num_tokens": 112642309.0, + "step": 48740 + }, + { + "epoch": 0.4469606674612634, + "learning_rate": 0.00011060970019253691, + "loss": 0.7948, + "mean_token_accuracy": 0.7600102841854095, + "num_tokens": 112665549.0, + "step": 48750 + }, + { + "epoch": 0.44705235170074265, + "learning_rate": 0.00011059136334464106, + "loss": 0.8529, + "mean_token_accuracy": 0.7448238372802735, + "num_tokens": 112688820.0, + "step": 48760 + }, + { + "epoch": 0.4471440359402219, + "learning_rate": 0.00011057302649674521, + "loss": 0.7746, + "mean_token_accuracy": 0.7631296992301941, + "num_tokens": 112711825.0, + "step": 48770 + }, + { + "epoch": 0.4472357201797011, + "learning_rate": 0.00011055468964884937, + "loss": 0.8449, + "mean_token_accuracy": 0.7509827733039856, + "num_tokens": 112735456.0, + "step": 48780 + }, + { + "epoch": 0.44732740441918034, + "learning_rate": 0.00011053635280095352, + "loss": 0.8539, + "mean_token_accuracy": 0.7425627887248993, + "num_tokens": 112758342.0, + "step": 48790 + }, + { + "epoch": 0.4474190886586596, + "learning_rate": 0.00011051801595305768, + "loss": 0.8925, + "mean_token_accuracy": 0.7421483218669891, + "num_tokens": 112781609.0, + "step": 48800 + }, + { + "epoch": 0.4475107728981388, + "learning_rate": 0.00011049967910516184, + "loss": 0.864, + "mean_token_accuracy": 0.7388948678970337, + "num_tokens": 112804584.0, + "step": 48810 + }, + { + "epoch": 0.44760245713761804, + "learning_rate": 0.00011048134225726599, + "loss": 0.8518, + "mean_token_accuracy": 0.7474654912948608, + "num_tokens": 112827395.0, + "step": 48820 + }, + { + "epoch": 0.4476941413770973, + "learning_rate": 0.00011046300540937014, + "loss": 0.8375, + "mean_token_accuracy": 0.7417679548263549, + "num_tokens": 112851109.0, + "step": 48830 + }, + { + "epoch": 0.4477858256165765, + "learning_rate": 0.00011044466856147429, + "loss": 0.8388, + "mean_token_accuracy": 0.7523158729076386, + "num_tokens": 112874602.0, + "step": 48840 + }, + { + "epoch": 0.44787750985605573, + "learning_rate": 0.00011042633171357843, + "loss": 0.8596, + "mean_token_accuracy": 0.7469957709312439, + "num_tokens": 112897642.0, + "step": 48850 + }, + { + "epoch": 0.447969194095535, + "learning_rate": 0.00011040799486568258, + "loss": 0.8798, + "mean_token_accuracy": 0.7374691367149353, + "num_tokens": 112921366.0, + "step": 48860 + }, + { + "epoch": 0.44806087833501423, + "learning_rate": 0.00011038965801778676, + "loss": 0.833, + "mean_token_accuracy": 0.7467567145824432, + "num_tokens": 112944561.0, + "step": 48870 + }, + { + "epoch": 0.44815256257449343, + "learning_rate": 0.00011037132116989091, + "loss": 0.8436, + "mean_token_accuracy": 0.747118490934372, + "num_tokens": 112967862.0, + "step": 48880 + }, + { + "epoch": 0.4482442468139727, + "learning_rate": 0.00011035298432199505, + "loss": 0.8251, + "mean_token_accuracy": 0.7517585754394531, + "num_tokens": 112990840.0, + "step": 48890 + }, + { + "epoch": 0.44833593105345193, + "learning_rate": 0.0001103346474740992, + "loss": 0.8541, + "mean_token_accuracy": 0.7512996613979339, + "num_tokens": 113014034.0, + "step": 48900 + }, + { + "epoch": 0.4484276152929311, + "learning_rate": 0.00011031631062620335, + "loss": 0.8539, + "mean_token_accuracy": 0.7437214195728302, + "num_tokens": 113037423.0, + "step": 48910 + }, + { + "epoch": 0.4485192995324104, + "learning_rate": 0.0001102979737783075, + "loss": 0.8396, + "mean_token_accuracy": 0.7485715508460998, + "num_tokens": 113061167.0, + "step": 48920 + }, + { + "epoch": 0.4486109837718896, + "learning_rate": 0.00011027963693041168, + "loss": 0.8486, + "mean_token_accuracy": 0.7500149130821228, + "num_tokens": 113084455.0, + "step": 48930 + }, + { + "epoch": 0.4487026680113688, + "learning_rate": 0.00011026130008251582, + "loss": 0.8333, + "mean_token_accuracy": 0.742855429649353, + "num_tokens": 113107016.0, + "step": 48940 + }, + { + "epoch": 0.44879435225084807, + "learning_rate": 0.00011024296323461997, + "loss": 0.8603, + "mean_token_accuracy": 0.743027514219284, + "num_tokens": 113129446.0, + "step": 48950 + }, + { + "epoch": 0.4488860364903273, + "learning_rate": 0.00011022462638672413, + "loss": 0.8164, + "mean_token_accuracy": 0.7533604979515076, + "num_tokens": 113152457.0, + "step": 48960 + }, + { + "epoch": 0.4489777207298066, + "learning_rate": 0.00011020628953882828, + "loss": 0.8203, + "mean_token_accuracy": 0.7508922159671784, + "num_tokens": 113176081.0, + "step": 48970 + }, + { + "epoch": 0.44906940496928577, + "learning_rate": 0.00011018795269093243, + "loss": 0.8663, + "mean_token_accuracy": 0.7423801779747009, + "num_tokens": 113199096.0, + "step": 48980 + }, + { + "epoch": 0.449161089208765, + "learning_rate": 0.00011016961584303658, + "loss": 0.8227, + "mean_token_accuracy": 0.7502870976924896, + "num_tokens": 113223453.0, + "step": 48990 + }, + { + "epoch": 0.44925277344824427, + "learning_rate": 0.00011015127899514075, + "loss": 0.8709, + "mean_token_accuracy": 0.7444837629795075, + "num_tokens": 113246436.0, + "step": 49000 + }, + { + "epoch": 0.44934445768772346, + "learning_rate": 0.0001101329421472449, + "loss": 0.8286, + "mean_token_accuracy": 0.7501603424549103, + "num_tokens": 113269700.0, + "step": 49010 + }, + { + "epoch": 0.4494361419272027, + "learning_rate": 0.00011011460529934905, + "loss": 0.8225, + "mean_token_accuracy": 0.7534201204776764, + "num_tokens": 113293917.0, + "step": 49020 + }, + { + "epoch": 0.44952782616668197, + "learning_rate": 0.0001100962684514532, + "loss": 0.8452, + "mean_token_accuracy": 0.748278695344925, + "num_tokens": 113316884.0, + "step": 49030 + }, + { + "epoch": 0.44961951040616116, + "learning_rate": 0.00011007793160355736, + "loss": 0.8707, + "mean_token_accuracy": 0.744801926612854, + "num_tokens": 113340314.0, + "step": 49040 + }, + { + "epoch": 0.4497111946456404, + "learning_rate": 0.0001100595947556615, + "loss": 0.8447, + "mean_token_accuracy": 0.7505634129047394, + "num_tokens": 113363471.0, + "step": 49050 + }, + { + "epoch": 0.44980287888511966, + "learning_rate": 0.00011004125790776567, + "loss": 0.8275, + "mean_token_accuracy": 0.7532466113567352, + "num_tokens": 113386679.0, + "step": 49060 + }, + { + "epoch": 0.44989456312459886, + "learning_rate": 0.00011002292105986982, + "loss": 0.864, + "mean_token_accuracy": 0.7395869612693786, + "num_tokens": 113410078.0, + "step": 49070 + }, + { + "epoch": 0.4499862473640781, + "learning_rate": 0.00011000458421197398, + "loss": 0.837, + "mean_token_accuracy": 0.7496163547039032, + "num_tokens": 113433602.0, + "step": 49080 + }, + { + "epoch": 0.45007793160355736, + "learning_rate": 0.00010998624736407811, + "loss": 0.8174, + "mean_token_accuracy": 0.7479480087757111, + "num_tokens": 113455785.0, + "step": 49090 + }, + { + "epoch": 0.4501696158430366, + "learning_rate": 0.00010996791051618227, + "loss": 0.8109, + "mean_token_accuracy": 0.7530344069004059, + "num_tokens": 113479378.0, + "step": 49100 + }, + { + "epoch": 0.4502613000825158, + "learning_rate": 0.00010994957366828642, + "loss": 0.8544, + "mean_token_accuracy": 0.7382154881954193, + "num_tokens": 113503006.0, + "step": 49110 + }, + { + "epoch": 0.45035298432199505, + "learning_rate": 0.00010993123682039057, + "loss": 0.8161, + "mean_token_accuracy": 0.7520354568958283, + "num_tokens": 113526408.0, + "step": 49120 + }, + { + "epoch": 0.4504446685614743, + "learning_rate": 0.00010991289997249475, + "loss": 0.8194, + "mean_token_accuracy": 0.7565617859363556, + "num_tokens": 113549645.0, + "step": 49130 + }, + { + "epoch": 0.4505363528009535, + "learning_rate": 0.00010989456312459889, + "loss": 0.867, + "mean_token_accuracy": 0.7475900232791901, + "num_tokens": 113572660.0, + "step": 49140 + }, + { + "epoch": 0.45062803704043275, + "learning_rate": 0.00010987622627670304, + "loss": 0.842, + "mean_token_accuracy": 0.7509126484394073, + "num_tokens": 113595738.0, + "step": 49150 + }, + { + "epoch": 0.450719721279912, + "learning_rate": 0.00010985788942880719, + "loss": 0.8846, + "mean_token_accuracy": 0.7325856447219848, + "num_tokens": 113618373.0, + "step": 49160 + }, + { + "epoch": 0.4508114055193912, + "learning_rate": 0.00010983955258091134, + "loss": 0.8355, + "mean_token_accuracy": 0.755406379699707, + "num_tokens": 113641563.0, + "step": 49170 + }, + { + "epoch": 0.45090308975887045, + "learning_rate": 0.0001098212157330155, + "loss": 0.8411, + "mean_token_accuracy": 0.7422263979911804, + "num_tokens": 113665643.0, + "step": 49180 + }, + { + "epoch": 0.4509947739983497, + "learning_rate": 0.00010980287888511965, + "loss": 0.85, + "mean_token_accuracy": 0.7456914603710174, + "num_tokens": 113688658.0, + "step": 49190 + }, + { + "epoch": 0.4510864582378289, + "learning_rate": 0.00010978454203722381, + "loss": 0.8761, + "mean_token_accuracy": 0.7379150867462159, + "num_tokens": 113711771.0, + "step": 49200 + }, + { + "epoch": 0.45117814247730814, + "learning_rate": 0.00010976620518932796, + "loss": 0.8219, + "mean_token_accuracy": 0.750760293006897, + "num_tokens": 113734772.0, + "step": 49210 + }, + { + "epoch": 0.4512698267167874, + "learning_rate": 0.00010974786834143212, + "loss": 0.8573, + "mean_token_accuracy": 0.7350454568862915, + "num_tokens": 113757914.0, + "step": 49220 + }, + { + "epoch": 0.45136151095626664, + "learning_rate": 0.00010972953149353627, + "loss": 0.797, + "mean_token_accuracy": 0.7552305936813355, + "num_tokens": 113780439.0, + "step": 49230 + }, + { + "epoch": 0.45145319519574584, + "learning_rate": 0.00010971119464564042, + "loss": 0.8196, + "mean_token_accuracy": 0.7575195908546448, + "num_tokens": 113803385.0, + "step": 49240 + }, + { + "epoch": 0.4515448794352251, + "learning_rate": 0.00010969285779774456, + "loss": 0.8887, + "mean_token_accuracy": 0.7384458303451538, + "num_tokens": 113826477.0, + "step": 49250 + }, + { + "epoch": 0.45163656367470434, + "learning_rate": 0.00010967452094984874, + "loss": 0.8369, + "mean_token_accuracy": 0.7467671036720276, + "num_tokens": 113850545.0, + "step": 49260 + }, + { + "epoch": 0.45172824791418353, + "learning_rate": 0.00010965618410195289, + "loss": 0.8208, + "mean_token_accuracy": 0.7519316792488098, + "num_tokens": 113874981.0, + "step": 49270 + }, + { + "epoch": 0.4518199321536628, + "learning_rate": 0.00010963784725405704, + "loss": 0.829, + "mean_token_accuracy": 0.7524272322654724, + "num_tokens": 113897540.0, + "step": 49280 + }, + { + "epoch": 0.45191161639314203, + "learning_rate": 0.00010961951040616118, + "loss": 0.8668, + "mean_token_accuracy": 0.739130049943924, + "num_tokens": 113921403.0, + "step": 49290 + }, + { + "epoch": 0.45200330063262123, + "learning_rate": 0.00010960117355826533, + "loss": 0.8245, + "mean_token_accuracy": 0.7519500851631165, + "num_tokens": 113944458.0, + "step": 49300 + }, + { + "epoch": 0.4520949848721005, + "learning_rate": 0.00010958283671036948, + "loss": 0.8246, + "mean_token_accuracy": 0.751862770318985, + "num_tokens": 113967690.0, + "step": 49310 + }, + { + "epoch": 0.45218666911157973, + "learning_rate": 0.00010956449986247363, + "loss": 0.8458, + "mean_token_accuracy": 0.7447650969028473, + "num_tokens": 113991343.0, + "step": 49320 + }, + { + "epoch": 0.4522783533510589, + "learning_rate": 0.00010954616301457781, + "loss": 0.8986, + "mean_token_accuracy": 0.7406126022338867, + "num_tokens": 114014515.0, + "step": 49330 + }, + { + "epoch": 0.4523700375905382, + "learning_rate": 0.00010952782616668195, + "loss": 0.8292, + "mean_token_accuracy": 0.749345576763153, + "num_tokens": 114037608.0, + "step": 49340 + }, + { + "epoch": 0.4524617218300174, + "learning_rate": 0.0001095094893187861, + "loss": 0.8354, + "mean_token_accuracy": 0.7491923153400422, + "num_tokens": 114061200.0, + "step": 49350 + }, + { + "epoch": 0.4525534060694967, + "learning_rate": 0.00010949115247089026, + "loss": 0.8482, + "mean_token_accuracy": 0.7426029682159424, + "num_tokens": 114084074.0, + "step": 49360 + }, + { + "epoch": 0.4526450903089759, + "learning_rate": 0.00010947281562299441, + "loss": 0.8104, + "mean_token_accuracy": 0.7577181577682495, + "num_tokens": 114107740.0, + "step": 49370 + }, + { + "epoch": 0.4527367745484551, + "learning_rate": 0.00010945447877509856, + "loss": 0.823, + "mean_token_accuracy": 0.7490709841251373, + "num_tokens": 114130569.0, + "step": 49380 + }, + { + "epoch": 0.4528284587879344, + "learning_rate": 0.00010943614192720272, + "loss": 0.812, + "mean_token_accuracy": 0.7540494084358216, + "num_tokens": 114154651.0, + "step": 49390 + }, + { + "epoch": 0.45292014302741357, + "learning_rate": 0.00010941780507930688, + "loss": 0.8759, + "mean_token_accuracy": 0.7451411008834838, + "num_tokens": 114177721.0, + "step": 49400 + }, + { + "epoch": 0.4530118272668928, + "learning_rate": 0.00010939946823141103, + "loss": 0.8165, + "mean_token_accuracy": 0.7556455373764038, + "num_tokens": 114200656.0, + "step": 49410 + }, + { + "epoch": 0.45310351150637207, + "learning_rate": 0.00010938113138351518, + "loss": 0.8431, + "mean_token_accuracy": 0.7506132960319519, + "num_tokens": 114224071.0, + "step": 49420 + }, + { + "epoch": 0.45319519574585126, + "learning_rate": 0.00010936279453561933, + "loss": 0.8505, + "mean_token_accuracy": 0.746786379814148, + "num_tokens": 114247298.0, + "step": 49430 + }, + { + "epoch": 0.4532868799853305, + "learning_rate": 0.00010934445768772348, + "loss": 0.8104, + "mean_token_accuracy": 0.7564125180244445, + "num_tokens": 114269942.0, + "step": 49440 + }, + { + "epoch": 0.45337856422480977, + "learning_rate": 0.00010932612083982762, + "loss": 0.8259, + "mean_token_accuracy": 0.7480632960796356, + "num_tokens": 114293166.0, + "step": 49450 + }, + { + "epoch": 0.453470248464289, + "learning_rate": 0.0001093077839919318, + "loss": 0.8311, + "mean_token_accuracy": 0.7524271965026855, + "num_tokens": 114316551.0, + "step": 49460 + }, + { + "epoch": 0.4535619327037682, + "learning_rate": 0.00010928944714403595, + "loss": 0.8592, + "mean_token_accuracy": 0.742966377735138, + "num_tokens": 114339708.0, + "step": 49470 + }, + { + "epoch": 0.45365361694324746, + "learning_rate": 0.0001092711102961401, + "loss": 0.8483, + "mean_token_accuracy": 0.7440168797969818, + "num_tokens": 114363328.0, + "step": 49480 + }, + { + "epoch": 0.4537453011827267, + "learning_rate": 0.00010925277344824424, + "loss": 0.8145, + "mean_token_accuracy": 0.7530664384365082, + "num_tokens": 114386281.0, + "step": 49490 + }, + { + "epoch": 0.4538369854222059, + "learning_rate": 0.0001092344366003484, + "loss": 0.8144, + "mean_token_accuracy": 0.7575432062149048, + "num_tokens": 114409297.0, + "step": 49500 + }, + { + "epoch": 0.45392866966168516, + "learning_rate": 0.00010921609975245255, + "loss": 0.8343, + "mean_token_accuracy": 0.7455037117004395, + "num_tokens": 114432655.0, + "step": 49510 + }, + { + "epoch": 0.4540203539011644, + "learning_rate": 0.00010919776290455673, + "loss": 0.8576, + "mean_token_accuracy": 0.7393884003162384, + "num_tokens": 114455275.0, + "step": 49520 + }, + { + "epoch": 0.4541120381406436, + "learning_rate": 0.00010917942605666088, + "loss": 0.8332, + "mean_token_accuracy": 0.746986186504364, + "num_tokens": 114478223.0, + "step": 49530 + }, + { + "epoch": 0.45420372238012285, + "learning_rate": 0.00010916108920876502, + "loss": 0.8317, + "mean_token_accuracy": 0.7462375462055206, + "num_tokens": 114501432.0, + "step": 49540 + }, + { + "epoch": 0.4542954066196021, + "learning_rate": 0.00010914275236086917, + "loss": 0.8068, + "mean_token_accuracy": 0.7507108628749848, + "num_tokens": 114524940.0, + "step": 49550 + }, + { + "epoch": 0.4543870908590813, + "learning_rate": 0.00010912441551297332, + "loss": 0.8599, + "mean_token_accuracy": 0.7398683190345764, + "num_tokens": 114547775.0, + "step": 49560 + }, + { + "epoch": 0.45447877509856055, + "learning_rate": 0.00010910607866507747, + "loss": 0.851, + "mean_token_accuracy": 0.7424595952033997, + "num_tokens": 114570577.0, + "step": 49570 + }, + { + "epoch": 0.4545704593380398, + "learning_rate": 0.00010908774181718162, + "loss": 0.8313, + "mean_token_accuracy": 0.7421681165695191, + "num_tokens": 114593620.0, + "step": 49580 + }, + { + "epoch": 0.45466214357751905, + "learning_rate": 0.00010906940496928579, + "loss": 0.833, + "mean_token_accuracy": 0.7452627182006836, + "num_tokens": 114616443.0, + "step": 49590 + }, + { + "epoch": 0.45475382781699825, + "learning_rate": 0.00010905106812138994, + "loss": 0.8581, + "mean_token_accuracy": 0.7472487986087799, + "num_tokens": 114640011.0, + "step": 49600 + }, + { + "epoch": 0.4548455120564775, + "learning_rate": 0.00010903273127349409, + "loss": 0.8251, + "mean_token_accuracy": 0.7492351531982422, + "num_tokens": 114663381.0, + "step": 49610 + }, + { + "epoch": 0.45493719629595675, + "learning_rate": 0.00010901439442559824, + "loss": 0.8166, + "mean_token_accuracy": 0.753437340259552, + "num_tokens": 114687242.0, + "step": 49620 + }, + { + "epoch": 0.45502888053543594, + "learning_rate": 0.0001089960575777024, + "loss": 0.8655, + "mean_token_accuracy": 0.7422393739223481, + "num_tokens": 114709454.0, + "step": 49630 + }, + { + "epoch": 0.4551205647749152, + "learning_rate": 0.00010897772072980655, + "loss": 0.8238, + "mean_token_accuracy": 0.7529425501823426, + "num_tokens": 114732151.0, + "step": 49640 + }, + { + "epoch": 0.45521224901439444, + "learning_rate": 0.00010895938388191071, + "loss": 0.8713, + "mean_token_accuracy": 0.7446607828140259, + "num_tokens": 114755040.0, + "step": 49650 + }, + { + "epoch": 0.45530393325387364, + "learning_rate": 0.00010894104703401487, + "loss": 0.8351, + "mean_token_accuracy": 0.7471251487731934, + "num_tokens": 114778102.0, + "step": 49660 + }, + { + "epoch": 0.4553956174933529, + "learning_rate": 0.00010892271018611902, + "loss": 0.8518, + "mean_token_accuracy": 0.7474866032600402, + "num_tokens": 114800788.0, + "step": 49670 + }, + { + "epoch": 0.45548730173283214, + "learning_rate": 0.00010890437333822317, + "loss": 0.8561, + "mean_token_accuracy": 0.7449249029159546, + "num_tokens": 114823909.0, + "step": 49680 + }, + { + "epoch": 0.45557898597231133, + "learning_rate": 0.00010888603649032731, + "loss": 0.8545, + "mean_token_accuracy": 0.7440057277679444, + "num_tokens": 114847934.0, + "step": 49690 + }, + { + "epoch": 0.4556706702117906, + "learning_rate": 0.00010886769964243146, + "loss": 0.8459, + "mean_token_accuracy": 0.7479400277137757, + "num_tokens": 114871114.0, + "step": 49700 + }, + { + "epoch": 0.45576235445126984, + "learning_rate": 0.00010884936279453561, + "loss": 0.8441, + "mean_token_accuracy": 0.745722359418869, + "num_tokens": 114895228.0, + "step": 49710 + }, + { + "epoch": 0.4558540386907491, + "learning_rate": 0.00010883102594663979, + "loss": 0.8146, + "mean_token_accuracy": 0.7478174984455108, + "num_tokens": 114919367.0, + "step": 49720 + }, + { + "epoch": 0.4559457229302283, + "learning_rate": 0.00010881268909874394, + "loss": 0.8631, + "mean_token_accuracy": 0.7402715504169464, + "num_tokens": 114942509.0, + "step": 49730 + }, + { + "epoch": 0.45603740716970753, + "learning_rate": 0.00010879435225084808, + "loss": 0.8297, + "mean_token_accuracy": 0.7462266325950623, + "num_tokens": 114966233.0, + "step": 49740 + }, + { + "epoch": 0.4561290914091868, + "learning_rate": 0.00010877601540295223, + "loss": 0.8258, + "mean_token_accuracy": 0.7475348711013794, + "num_tokens": 114989497.0, + "step": 49750 + }, + { + "epoch": 0.456220775648666, + "learning_rate": 0.00010875767855505638, + "loss": 0.8924, + "mean_token_accuracy": 0.7382708609104156, + "num_tokens": 115012636.0, + "step": 49760 + }, + { + "epoch": 0.4563124598881452, + "learning_rate": 0.00010873934170716054, + "loss": 0.8237, + "mean_token_accuracy": 0.754587596654892, + "num_tokens": 115035701.0, + "step": 49770 + }, + { + "epoch": 0.4564041441276245, + "learning_rate": 0.0001087210048592647, + "loss": 0.8427, + "mean_token_accuracy": 0.7473047614097595, + "num_tokens": 115058173.0, + "step": 49780 + }, + { + "epoch": 0.4564958283671037, + "learning_rate": 0.00010870266801136885, + "loss": 0.8303, + "mean_token_accuracy": 0.7516798675060272, + "num_tokens": 115080946.0, + "step": 49790 + }, + { + "epoch": 0.4565875126065829, + "learning_rate": 0.000108684331163473, + "loss": 0.9069, + "mean_token_accuracy": 0.7308391451835632, + "num_tokens": 115104503.0, + "step": 49800 + }, + { + "epoch": 0.4566791968460622, + "learning_rate": 0.00010866599431557716, + "loss": 0.8685, + "mean_token_accuracy": 0.741806811094284, + "num_tokens": 115128179.0, + "step": 49810 + }, + { + "epoch": 0.45677088108554137, + "learning_rate": 0.00010864765746768131, + "loss": 0.8707, + "mean_token_accuracy": 0.7365410387516022, + "num_tokens": 115152009.0, + "step": 49820 + }, + { + "epoch": 0.4568625653250206, + "learning_rate": 0.00010862932061978546, + "loss": 0.8427, + "mean_token_accuracy": 0.7453692495822907, + "num_tokens": 115174952.0, + "step": 49830 + }, + { + "epoch": 0.45695424956449987, + "learning_rate": 0.00010861098377188961, + "loss": 0.8778, + "mean_token_accuracy": 0.7436991155147552, + "num_tokens": 115197963.0, + "step": 49840 + }, + { + "epoch": 0.4570459338039791, + "learning_rate": 0.00010859264692399378, + "loss": 0.8446, + "mean_token_accuracy": 0.7575132727622986, + "num_tokens": 115220780.0, + "step": 49850 + }, + { + "epoch": 0.4571376180434583, + "learning_rate": 0.00010857431007609793, + "loss": 0.8327, + "mean_token_accuracy": 0.7503166556358337, + "num_tokens": 115242933.0, + "step": 49860 + }, + { + "epoch": 0.45722930228293757, + "learning_rate": 0.00010855597322820208, + "loss": 0.8344, + "mean_token_accuracy": 0.7496700286865234, + "num_tokens": 115266172.0, + "step": 49870 + }, + { + "epoch": 0.4573209865224168, + "learning_rate": 0.00010853763638030623, + "loss": 0.8497, + "mean_token_accuracy": 0.7433329045772552, + "num_tokens": 115289280.0, + "step": 49880 + }, + { + "epoch": 0.457412670761896, + "learning_rate": 0.00010851929953241037, + "loss": 0.8299, + "mean_token_accuracy": 0.7510054588317872, + "num_tokens": 115312699.0, + "step": 49890 + }, + { + "epoch": 0.45750435500137526, + "learning_rate": 0.00010850096268451452, + "loss": 0.8395, + "mean_token_accuracy": 0.7443045854568482, + "num_tokens": 115335620.0, + "step": 49900 + }, + { + "epoch": 0.4575960392408545, + "learning_rate": 0.0001084826258366187, + "loss": 0.8996, + "mean_token_accuracy": 0.7296887338161469, + "num_tokens": 115358098.0, + "step": 49910 + }, + { + "epoch": 0.4576877234803337, + "learning_rate": 0.00010846428898872285, + "loss": 0.8163, + "mean_token_accuracy": 0.751824027299881, + "num_tokens": 115381361.0, + "step": 49920 + }, + { + "epoch": 0.45777940771981296, + "learning_rate": 0.00010844595214082701, + "loss": 0.8277, + "mean_token_accuracy": 0.7506865561008453, + "num_tokens": 115404842.0, + "step": 49930 + }, + { + "epoch": 0.4578710919592922, + "learning_rate": 0.00010842761529293115, + "loss": 0.8266, + "mean_token_accuracy": 0.7501639425754547, + "num_tokens": 115427625.0, + "step": 49940 + }, + { + "epoch": 0.4579627761987714, + "learning_rate": 0.0001084092784450353, + "loss": 0.8644, + "mean_token_accuracy": 0.7454055070877075, + "num_tokens": 115451230.0, + "step": 49950 + }, + { + "epoch": 0.45805446043825065, + "learning_rate": 0.00010839094159713945, + "loss": 0.8258, + "mean_token_accuracy": 0.7487506866455078, + "num_tokens": 115474683.0, + "step": 49960 + }, + { + "epoch": 0.4581461446777299, + "learning_rate": 0.0001083726047492436, + "loss": 0.8183, + "mean_token_accuracy": 0.7492614328861237, + "num_tokens": 115497894.0, + "step": 49970 + }, + { + "epoch": 0.45823782891720916, + "learning_rate": 0.00010835426790134777, + "loss": 0.8423, + "mean_token_accuracy": 0.749496477842331, + "num_tokens": 115521237.0, + "step": 49980 + }, + { + "epoch": 0.45832951315668835, + "learning_rate": 0.00010833593105345192, + "loss": 0.846, + "mean_token_accuracy": 0.746222198009491, + "num_tokens": 115544763.0, + "step": 49990 + }, + { + "epoch": 0.4584211973961676, + "learning_rate": 0.00010831759420555607, + "loss": 0.8175, + "mean_token_accuracy": 0.7521841049194335, + "num_tokens": 115568240.0, + "step": 50000 + }, + { + "epoch": 0.45851288163564685, + "learning_rate": 0.00010829925735766022, + "loss": 0.8484, + "mean_token_accuracy": 0.7403563261032104, + "num_tokens": 115591813.0, + "step": 50010 + }, + { + "epoch": 0.45860456587512605, + "learning_rate": 0.00010828092050976437, + "loss": 0.8313, + "mean_token_accuracy": 0.7544568061828614, + "num_tokens": 115614726.0, + "step": 50020 + }, + { + "epoch": 0.4586962501146053, + "learning_rate": 0.00010826258366186853, + "loss": 0.8242, + "mean_token_accuracy": 0.7494811654090882, + "num_tokens": 115638111.0, + "step": 50030 + }, + { + "epoch": 0.45878793435408455, + "learning_rate": 0.00010824424681397269, + "loss": 0.8091, + "mean_token_accuracy": 0.7566789090633392, + "num_tokens": 115661738.0, + "step": 50040 + }, + { + "epoch": 0.45887961859356374, + "learning_rate": 0.00010822590996607684, + "loss": 0.8165, + "mean_token_accuracy": 0.7553297936916351, + "num_tokens": 115684907.0, + "step": 50050 + }, + { + "epoch": 0.458971302833043, + "learning_rate": 0.000108207573118181, + "loss": 0.837, + "mean_token_accuracy": 0.7515370666980743, + "num_tokens": 115707567.0, + "step": 50060 + }, + { + "epoch": 0.45906298707252224, + "learning_rate": 0.00010818923627028515, + "loss": 0.8275, + "mean_token_accuracy": 0.754007738828659, + "num_tokens": 115730192.0, + "step": 50070 + }, + { + "epoch": 0.4591546713120015, + "learning_rate": 0.0001081708994223893, + "loss": 0.8023, + "mean_token_accuracy": 0.757024222612381, + "num_tokens": 115752620.0, + "step": 50080 + }, + { + "epoch": 0.4592463555514807, + "learning_rate": 0.00010815256257449344, + "loss": 0.8688, + "mean_token_accuracy": 0.7419677913188935, + "num_tokens": 115776581.0, + "step": 50090 + }, + { + "epoch": 0.45933803979095994, + "learning_rate": 0.00010813422572659759, + "loss": 0.8853, + "mean_token_accuracy": 0.7376410245895386, + "num_tokens": 115799978.0, + "step": 50100 + }, + { + "epoch": 0.4594297240304392, + "learning_rate": 0.00010811588887870177, + "loss": 0.8144, + "mean_token_accuracy": 0.7546159029006958, + "num_tokens": 115823279.0, + "step": 50110 + }, + { + "epoch": 0.4595214082699184, + "learning_rate": 0.00010809755203080592, + "loss": 0.8345, + "mean_token_accuracy": 0.7492096900939942, + "num_tokens": 115846249.0, + "step": 50120 + }, + { + "epoch": 0.45961309250939764, + "learning_rate": 0.00010807921518291007, + "loss": 0.8244, + "mean_token_accuracy": 0.7569547533988953, + "num_tokens": 115869287.0, + "step": 50130 + }, + { + "epoch": 0.4597047767488769, + "learning_rate": 0.00010806087833501421, + "loss": 0.8025, + "mean_token_accuracy": 0.7493510842323303, + "num_tokens": 115892147.0, + "step": 50140 + }, + { + "epoch": 0.4597964609883561, + "learning_rate": 0.00010804254148711836, + "loss": 0.8586, + "mean_token_accuracy": 0.7442805290222168, + "num_tokens": 115915570.0, + "step": 50150 + }, + { + "epoch": 0.45988814522783533, + "learning_rate": 0.00010802420463922251, + "loss": 0.837, + "mean_token_accuracy": 0.7487399339675903, + "num_tokens": 115938993.0, + "step": 50160 + }, + { + "epoch": 0.4599798294673146, + "learning_rate": 0.00010800586779132669, + "loss": 0.8402, + "mean_token_accuracy": 0.7479621529579162, + "num_tokens": 115961349.0, + "step": 50170 + }, + { + "epoch": 0.4600715137067938, + "learning_rate": 0.00010798753094343083, + "loss": 0.8231, + "mean_token_accuracy": 0.7495421350002289, + "num_tokens": 115984834.0, + "step": 50180 + }, + { + "epoch": 0.46016319794627303, + "learning_rate": 0.00010796919409553498, + "loss": 0.8541, + "mean_token_accuracy": 0.7462188839912415, + "num_tokens": 116007818.0, + "step": 50190 + }, + { + "epoch": 0.4602548821857523, + "learning_rate": 0.00010795085724763913, + "loss": 0.8535, + "mean_token_accuracy": 0.7470133304595947, + "num_tokens": 116031305.0, + "step": 50200 + }, + { + "epoch": 0.46034656642523153, + "learning_rate": 0.00010793252039974329, + "loss": 0.8249, + "mean_token_accuracy": 0.7510017812252044, + "num_tokens": 116054213.0, + "step": 50210 + }, + { + "epoch": 0.4604382506647107, + "learning_rate": 0.00010791418355184744, + "loss": 0.8375, + "mean_token_accuracy": 0.7504799664020538, + "num_tokens": 116076506.0, + "step": 50220 + }, + { + "epoch": 0.46052993490419, + "learning_rate": 0.00010789584670395159, + "loss": 0.8627, + "mean_token_accuracy": 0.7414623498916626, + "num_tokens": 116100639.0, + "step": 50230 + }, + { + "epoch": 0.4606216191436692, + "learning_rate": 0.00010787750985605576, + "loss": 0.8896, + "mean_token_accuracy": 0.7352072656154632, + "num_tokens": 116124090.0, + "step": 50240 + }, + { + "epoch": 0.4607133033831484, + "learning_rate": 0.00010785917300815991, + "loss": 0.8479, + "mean_token_accuracy": 0.7485179603099823, + "num_tokens": 116146498.0, + "step": 50250 + }, + { + "epoch": 0.46080498762262767, + "learning_rate": 0.00010784083616026406, + "loss": 0.8164, + "mean_token_accuracy": 0.7551505208015442, + "num_tokens": 116169667.0, + "step": 50260 + }, + { + "epoch": 0.4608966718621069, + "learning_rate": 0.00010782249931236821, + "loss": 0.8514, + "mean_token_accuracy": 0.7464648723602295, + "num_tokens": 116192840.0, + "step": 50270 + }, + { + "epoch": 0.4609883561015861, + "learning_rate": 0.00010780416246447236, + "loss": 0.824, + "mean_token_accuracy": 0.7510474324226379, + "num_tokens": 116215831.0, + "step": 50280 + }, + { + "epoch": 0.46108004034106537, + "learning_rate": 0.0001077858256165765, + "loss": 0.8225, + "mean_token_accuracy": 0.7547004103660584, + "num_tokens": 116238647.0, + "step": 50290 + }, + { + "epoch": 0.4611717245805446, + "learning_rate": 0.00010776748876868068, + "loss": 0.8619, + "mean_token_accuracy": 0.7416106343269349, + "num_tokens": 116261417.0, + "step": 50300 + }, + { + "epoch": 0.4612634088200238, + "learning_rate": 0.00010774915192078483, + "loss": 0.8663, + "mean_token_accuracy": 0.7462671041488648, + "num_tokens": 116285092.0, + "step": 50310 + }, + { + "epoch": 0.46135509305950306, + "learning_rate": 0.00010773081507288898, + "loss": 0.8562, + "mean_token_accuracy": 0.7486227571964263, + "num_tokens": 116308572.0, + "step": 50320 + }, + { + "epoch": 0.4614467772989823, + "learning_rate": 0.00010771247822499314, + "loss": 0.8318, + "mean_token_accuracy": 0.7512663900852203, + "num_tokens": 116331203.0, + "step": 50330 + }, + { + "epoch": 0.46153846153846156, + "learning_rate": 0.00010769414137709727, + "loss": 0.8212, + "mean_token_accuracy": 0.7521014273166656, + "num_tokens": 116353705.0, + "step": 50340 + }, + { + "epoch": 0.46163014577794076, + "learning_rate": 0.00010767580452920143, + "loss": 0.8595, + "mean_token_accuracy": 0.7383383989334107, + "num_tokens": 116376058.0, + "step": 50350 + }, + { + "epoch": 0.46172183001742, + "learning_rate": 0.00010765746768130558, + "loss": 0.8467, + "mean_token_accuracy": 0.7493795573711395, + "num_tokens": 116399235.0, + "step": 50360 + }, + { + "epoch": 0.46181351425689926, + "learning_rate": 0.00010763913083340976, + "loss": 0.8411, + "mean_token_accuracy": 0.7499105215072632, + "num_tokens": 116422093.0, + "step": 50370 + }, + { + "epoch": 0.46190519849637846, + "learning_rate": 0.0001076207939855139, + "loss": 0.8264, + "mean_token_accuracy": 0.7485403299331665, + "num_tokens": 116444540.0, + "step": 50380 + }, + { + "epoch": 0.4619968827358577, + "learning_rate": 0.00010760245713761805, + "loss": 0.8763, + "mean_token_accuracy": 0.7494730412960052, + "num_tokens": 116468067.0, + "step": 50390 + }, + { + "epoch": 0.46208856697533696, + "learning_rate": 0.0001075841202897222, + "loss": 0.8229, + "mean_token_accuracy": 0.7540560901165009, + "num_tokens": 116490872.0, + "step": 50400 + }, + { + "epoch": 0.46218025121481615, + "learning_rate": 0.00010756578344182635, + "loss": 0.871, + "mean_token_accuracy": 0.7454632878303528, + "num_tokens": 116513739.0, + "step": 50410 + }, + { + "epoch": 0.4622719354542954, + "learning_rate": 0.0001075474465939305, + "loss": 0.8204, + "mean_token_accuracy": 0.7500062763690949, + "num_tokens": 116536617.0, + "step": 50420 + }, + { + "epoch": 0.46236361969377465, + "learning_rate": 0.00010752910974603465, + "loss": 0.864, + "mean_token_accuracy": 0.7448347449302674, + "num_tokens": 116559527.0, + "step": 50430 + }, + { + "epoch": 0.46245530393325385, + "learning_rate": 0.00010751077289813882, + "loss": 0.8291, + "mean_token_accuracy": 0.7494826912879944, + "num_tokens": 116582109.0, + "step": 50440 + }, + { + "epoch": 0.4625469881727331, + "learning_rate": 0.00010749243605024297, + "loss": 0.8602, + "mean_token_accuracy": 0.7425334811210632, + "num_tokens": 116605397.0, + "step": 50450 + }, + { + "epoch": 0.46263867241221235, + "learning_rate": 0.00010747409920234712, + "loss": 0.8183, + "mean_token_accuracy": 0.7540872037410736, + "num_tokens": 116627798.0, + "step": 50460 + }, + { + "epoch": 0.4627303566516916, + "learning_rate": 0.00010745576235445128, + "loss": 0.8242, + "mean_token_accuracy": 0.7543343484401703, + "num_tokens": 116650549.0, + "step": 50470 + }, + { + "epoch": 0.4628220408911708, + "learning_rate": 0.00010743742550655543, + "loss": 0.8319, + "mean_token_accuracy": 0.7507722616195679, + "num_tokens": 116673922.0, + "step": 50480 + }, + { + "epoch": 0.46291372513065004, + "learning_rate": 0.00010741908865865957, + "loss": 0.8355, + "mean_token_accuracy": 0.7464515626430511, + "num_tokens": 116697639.0, + "step": 50490 + }, + { + "epoch": 0.4630054093701293, + "learning_rate": 0.00010740075181076374, + "loss": 0.8437, + "mean_token_accuracy": 0.7505419135093689, + "num_tokens": 116720789.0, + "step": 50500 + }, + { + "epoch": 0.4630970936096085, + "learning_rate": 0.0001073824149628679, + "loss": 0.8655, + "mean_token_accuracy": 0.7391029357910156, + "num_tokens": 116744169.0, + "step": 50510 + }, + { + "epoch": 0.46318877784908774, + "learning_rate": 0.00010736407811497205, + "loss": 0.8311, + "mean_token_accuracy": 0.7503938496112823, + "num_tokens": 116766188.0, + "step": 50520 + }, + { + "epoch": 0.463280462088567, + "learning_rate": 0.0001073457412670762, + "loss": 0.8614, + "mean_token_accuracy": 0.744571739435196, + "num_tokens": 116788861.0, + "step": 50530 + }, + { + "epoch": 0.4633721463280462, + "learning_rate": 0.00010732740441918034, + "loss": 0.8259, + "mean_token_accuracy": 0.749758392572403, + "num_tokens": 116811487.0, + "step": 50540 + }, + { + "epoch": 0.46346383056752544, + "learning_rate": 0.00010730906757128449, + "loss": 0.8064, + "mean_token_accuracy": 0.753113043308258, + "num_tokens": 116835181.0, + "step": 50550 + }, + { + "epoch": 0.4635555148070047, + "learning_rate": 0.00010729073072338864, + "loss": 0.8395, + "mean_token_accuracy": 0.7491614937782287, + "num_tokens": 116857859.0, + "step": 50560 + }, + { + "epoch": 0.4636471990464839, + "learning_rate": 0.00010727239387549282, + "loss": 0.8222, + "mean_token_accuracy": 0.7530656456947327, + "num_tokens": 116881321.0, + "step": 50570 + }, + { + "epoch": 0.46373888328596313, + "learning_rate": 0.00010725405702759696, + "loss": 0.793, + "mean_token_accuracy": 0.7553530097007751, + "num_tokens": 116904790.0, + "step": 50580 + }, + { + "epoch": 0.4638305675254424, + "learning_rate": 0.00010723572017970111, + "loss": 0.8549, + "mean_token_accuracy": 0.7461807429790497, + "num_tokens": 116928194.0, + "step": 50590 + }, + { + "epoch": 0.46392225176492163, + "learning_rate": 0.00010721738333180526, + "loss": 0.8175, + "mean_token_accuracy": 0.7489982545375824, + "num_tokens": 116951407.0, + "step": 50600 + }, + { + "epoch": 0.46401393600440083, + "learning_rate": 0.00010719904648390942, + "loss": 0.8439, + "mean_token_accuracy": 0.7496041774749755, + "num_tokens": 116975147.0, + "step": 50610 + }, + { + "epoch": 0.4641056202438801, + "learning_rate": 0.00010718070963601357, + "loss": 0.8252, + "mean_token_accuracy": 0.7445078730583191, + "num_tokens": 116999365.0, + "step": 50620 + }, + { + "epoch": 0.46419730448335933, + "learning_rate": 0.00010716237278811773, + "loss": 0.8451, + "mean_token_accuracy": 0.7497836112976074, + "num_tokens": 117022386.0, + "step": 50630 + }, + { + "epoch": 0.4642889887228385, + "learning_rate": 0.00010714403594022188, + "loss": 0.8437, + "mean_token_accuracy": 0.7496808290481567, + "num_tokens": 117045041.0, + "step": 50640 + }, + { + "epoch": 0.4643806729623178, + "learning_rate": 0.00010712569909232604, + "loss": 0.853, + "mean_token_accuracy": 0.7458152651786805, + "num_tokens": 117068307.0, + "step": 50650 + }, + { + "epoch": 0.464472357201797, + "learning_rate": 0.00010710736224443019, + "loss": 0.8496, + "mean_token_accuracy": 0.7513097286224365, + "num_tokens": 117091801.0, + "step": 50660 + }, + { + "epoch": 0.4645640414412762, + "learning_rate": 0.00010708902539653434, + "loss": 0.7991, + "mean_token_accuracy": 0.7584814131259918, + "num_tokens": 117114593.0, + "step": 50670 + }, + { + "epoch": 0.46465572568075547, + "learning_rate": 0.00010707068854863849, + "loss": 0.874, + "mean_token_accuracy": 0.7379404366016388, + "num_tokens": 117137486.0, + "step": 50680 + }, + { + "epoch": 0.4647474099202347, + "learning_rate": 0.00010705235170074264, + "loss": 0.8847, + "mean_token_accuracy": 0.7391998946666718, + "num_tokens": 117160033.0, + "step": 50690 + }, + { + "epoch": 0.464839094159714, + "learning_rate": 0.00010703401485284681, + "loss": 0.8627, + "mean_token_accuracy": 0.7434830665588379, + "num_tokens": 117183427.0, + "step": 50700 + }, + { + "epoch": 0.46493077839919317, + "learning_rate": 0.00010701567800495096, + "loss": 0.8555, + "mean_token_accuracy": 0.7426767408847809, + "num_tokens": 117206345.0, + "step": 50710 + }, + { + "epoch": 0.4650224626386724, + "learning_rate": 0.00010699734115705511, + "loss": 0.8835, + "mean_token_accuracy": 0.7401986122131348, + "num_tokens": 117229219.0, + "step": 50720 + }, + { + "epoch": 0.46511414687815167, + "learning_rate": 0.00010697900430915926, + "loss": 0.8578, + "mean_token_accuracy": 0.7393283247947693, + "num_tokens": 117252991.0, + "step": 50730 + }, + { + "epoch": 0.46520583111763086, + "learning_rate": 0.0001069606674612634, + "loss": 0.7975, + "mean_token_accuracy": 0.7621454775333405, + "num_tokens": 117275853.0, + "step": 50740 + }, + { + "epoch": 0.4652975153571101, + "learning_rate": 0.00010694233061336755, + "loss": 0.823, + "mean_token_accuracy": 0.7500155448913575, + "num_tokens": 117298624.0, + "step": 50750 + }, + { + "epoch": 0.46538919959658936, + "learning_rate": 0.00010692399376547173, + "loss": 0.8217, + "mean_token_accuracy": 0.7510518133640289, + "num_tokens": 117322138.0, + "step": 50760 + }, + { + "epoch": 0.46548088383606856, + "learning_rate": 0.00010690565691757589, + "loss": 0.8252, + "mean_token_accuracy": 0.748747569322586, + "num_tokens": 117345049.0, + "step": 50770 + }, + { + "epoch": 0.4655725680755478, + "learning_rate": 0.00010688732006968002, + "loss": 0.8154, + "mean_token_accuracy": 0.7526210367679596, + "num_tokens": 117367844.0, + "step": 50780 + }, + { + "epoch": 0.46566425231502706, + "learning_rate": 0.00010686898322178418, + "loss": 0.891, + "mean_token_accuracy": 0.7360921025276184, + "num_tokens": 117391359.0, + "step": 50790 + }, + { + "epoch": 0.46575593655450626, + "learning_rate": 0.00010685064637388833, + "loss": 0.8708, + "mean_token_accuracy": 0.7436611413955688, + "num_tokens": 117414531.0, + "step": 50800 + }, + { + "epoch": 0.4658476207939855, + "learning_rate": 0.00010683230952599248, + "loss": 0.7885, + "mean_token_accuracy": 0.7603997647762298, + "num_tokens": 117437361.0, + "step": 50810 + }, + { + "epoch": 0.46593930503346476, + "learning_rate": 0.00010681397267809663, + "loss": 0.8376, + "mean_token_accuracy": 0.7506824672222138, + "num_tokens": 117460283.0, + "step": 50820 + }, + { + "epoch": 0.466030989272944, + "learning_rate": 0.0001067956358302008, + "loss": 0.8133, + "mean_token_accuracy": 0.7531838774681091, + "num_tokens": 117482509.0, + "step": 50830 + }, + { + "epoch": 0.4661226735124232, + "learning_rate": 0.00010677729898230495, + "loss": 0.8531, + "mean_token_accuracy": 0.7507034957408905, + "num_tokens": 117506382.0, + "step": 50840 + }, + { + "epoch": 0.46621435775190245, + "learning_rate": 0.0001067589621344091, + "loss": 0.8281, + "mean_token_accuracy": 0.7464346587657928, + "num_tokens": 117529661.0, + "step": 50850 + }, + { + "epoch": 0.4663060419913817, + "learning_rate": 0.00010674062528651325, + "loss": 0.8491, + "mean_token_accuracy": 0.7451833069324494, + "num_tokens": 117552202.0, + "step": 50860 + }, + { + "epoch": 0.4663977262308609, + "learning_rate": 0.0001067222884386174, + "loss": 0.8243, + "mean_token_accuracy": 0.748199737071991, + "num_tokens": 117576254.0, + "step": 50870 + }, + { + "epoch": 0.46648941047034015, + "learning_rate": 0.00010670395159072156, + "loss": 0.8353, + "mean_token_accuracy": 0.7499429762363434, + "num_tokens": 117599490.0, + "step": 50880 + }, + { + "epoch": 0.4665810947098194, + "learning_rate": 0.00010668561474282572, + "loss": 0.8031, + "mean_token_accuracy": 0.7485783219337463, + "num_tokens": 117622567.0, + "step": 50890 + }, + { + "epoch": 0.4666727789492986, + "learning_rate": 0.00010666727789492987, + "loss": 0.8374, + "mean_token_accuracy": 0.7473032593727111, + "num_tokens": 117645775.0, + "step": 50900 + }, + { + "epoch": 0.46676446318877785, + "learning_rate": 0.00010664894104703403, + "loss": 0.8202, + "mean_token_accuracy": 0.7585340678691864, + "num_tokens": 117669341.0, + "step": 50910 + }, + { + "epoch": 0.4668561474282571, + "learning_rate": 0.00010663060419913818, + "loss": 0.8701, + "mean_token_accuracy": 0.7439858019351959, + "num_tokens": 117691666.0, + "step": 50920 + }, + { + "epoch": 0.4669478316677363, + "learning_rate": 0.00010661226735124233, + "loss": 0.8275, + "mean_token_accuracy": 0.7561112999916076, + "num_tokens": 117715316.0, + "step": 50930 + }, + { + "epoch": 0.46703951590721554, + "learning_rate": 0.00010659393050334647, + "loss": 0.8734, + "mean_token_accuracy": 0.740497225522995, + "num_tokens": 117738787.0, + "step": 50940 + }, + { + "epoch": 0.4671312001466948, + "learning_rate": 0.00010657559365545062, + "loss": 0.8505, + "mean_token_accuracy": 0.7452231168746948, + "num_tokens": 117761967.0, + "step": 50950 + }, + { + "epoch": 0.46722288438617404, + "learning_rate": 0.0001065572568075548, + "loss": 0.8472, + "mean_token_accuracy": 0.7463249921798706, + "num_tokens": 117784543.0, + "step": 50960 + }, + { + "epoch": 0.46731456862565324, + "learning_rate": 0.00010653891995965895, + "loss": 0.8127, + "mean_token_accuracy": 0.7490747451782227, + "num_tokens": 117806932.0, + "step": 50970 + }, + { + "epoch": 0.4674062528651325, + "learning_rate": 0.00010652058311176309, + "loss": 0.8586, + "mean_token_accuracy": 0.7450135529041291, + "num_tokens": 117830057.0, + "step": 50980 + }, + { + "epoch": 0.46749793710461174, + "learning_rate": 0.00010650224626386724, + "loss": 0.8774, + "mean_token_accuracy": 0.7434897541999816, + "num_tokens": 117853793.0, + "step": 50990 + }, + { + "epoch": 0.46758962134409093, + "learning_rate": 0.00010648390941597139, + "loss": 0.8635, + "mean_token_accuracy": 0.7430111706256867, + "num_tokens": 117876448.0, + "step": 51000 + }, + { + "epoch": 0.4676813055835702, + "learning_rate": 0.00010646557256807554, + "loss": 0.8815, + "mean_token_accuracy": 0.7391182601451873, + "num_tokens": 117899109.0, + "step": 51010 + }, + { + "epoch": 0.46777298982304943, + "learning_rate": 0.00010644723572017972, + "loss": 0.8334, + "mean_token_accuracy": 0.7455284893512726, + "num_tokens": 117923303.0, + "step": 51020 + }, + { + "epoch": 0.46786467406252863, + "learning_rate": 0.00010642889887228386, + "loss": 0.8003, + "mean_token_accuracy": 0.7555950045585632, + "num_tokens": 117945852.0, + "step": 51030 + }, + { + "epoch": 0.4679563583020079, + "learning_rate": 0.00010641056202438801, + "loss": 0.8312, + "mean_token_accuracy": 0.7510682940483093, + "num_tokens": 117970004.0, + "step": 51040 + }, + { + "epoch": 0.46804804254148713, + "learning_rate": 0.00010639222517649217, + "loss": 0.8312, + "mean_token_accuracy": 0.7443981349468232, + "num_tokens": 117991660.0, + "step": 51050 + }, + { + "epoch": 0.4681397267809663, + "learning_rate": 0.00010637388832859632, + "loss": 0.8511, + "mean_token_accuracy": 0.7525094747543335, + "num_tokens": 118014556.0, + "step": 51060 + }, + { + "epoch": 0.4682314110204456, + "learning_rate": 0.00010635555148070047, + "loss": 0.8416, + "mean_token_accuracy": 0.7467299461364746, + "num_tokens": 118037560.0, + "step": 51070 + }, + { + "epoch": 0.4683230952599248, + "learning_rate": 0.00010633721463280462, + "loss": 0.8672, + "mean_token_accuracy": 0.7387905538082122, + "num_tokens": 118060953.0, + "step": 51080 + }, + { + "epoch": 0.4684147794994041, + "learning_rate": 0.00010631887778490879, + "loss": 0.8508, + "mean_token_accuracy": 0.7508937537670135, + "num_tokens": 118084704.0, + "step": 51090 + }, + { + "epoch": 0.46850646373888327, + "learning_rate": 0.00010630054093701294, + "loss": 0.858, + "mean_token_accuracy": 0.7452883899211884, + "num_tokens": 118108778.0, + "step": 51100 + }, + { + "epoch": 0.4685981479783625, + "learning_rate": 0.00010628220408911709, + "loss": 0.8453, + "mean_token_accuracy": 0.7486472249031066, + "num_tokens": 118131700.0, + "step": 51110 + }, + { + "epoch": 0.4686898322178418, + "learning_rate": 0.00010626386724122124, + "loss": 0.8769, + "mean_token_accuracy": 0.7451722025871277, + "num_tokens": 118155078.0, + "step": 51120 + }, + { + "epoch": 0.46878151645732097, + "learning_rate": 0.0001062455303933254, + "loss": 0.8744, + "mean_token_accuracy": 0.743290901184082, + "num_tokens": 118178973.0, + "step": 51130 + }, + { + "epoch": 0.4688732006968002, + "learning_rate": 0.00010622719354542953, + "loss": 0.8354, + "mean_token_accuracy": 0.7442569673061371, + "num_tokens": 118202027.0, + "step": 51140 + }, + { + "epoch": 0.46896488493627947, + "learning_rate": 0.00010620885669753371, + "loss": 0.8316, + "mean_token_accuracy": 0.7528537273406982, + "num_tokens": 118225208.0, + "step": 51150 + }, + { + "epoch": 0.46905656917575866, + "learning_rate": 0.00010619051984963786, + "loss": 0.8307, + "mean_token_accuracy": 0.7523713350296021, + "num_tokens": 118248682.0, + "step": 51160 + }, + { + "epoch": 0.4691482534152379, + "learning_rate": 0.00010617218300174201, + "loss": 0.8585, + "mean_token_accuracy": 0.7432997345924377, + "num_tokens": 118271357.0, + "step": 51170 + }, + { + "epoch": 0.46923993765471717, + "learning_rate": 0.00010615384615384615, + "loss": 0.8127, + "mean_token_accuracy": 0.7542767465114594, + "num_tokens": 118293294.0, + "step": 51180 + }, + { + "epoch": 0.46933162189419636, + "learning_rate": 0.0001061355093059503, + "loss": 0.8512, + "mean_token_accuracy": 0.7457583487033844, + "num_tokens": 118316071.0, + "step": 51190 + }, + { + "epoch": 0.4694233061336756, + "learning_rate": 0.00010611717245805446, + "loss": 0.805, + "mean_token_accuracy": 0.7538500905036927, + "num_tokens": 118338236.0, + "step": 51200 + }, + { + "epoch": 0.46951499037315486, + "learning_rate": 0.00010609883561015861, + "loss": 0.8382, + "mean_token_accuracy": 0.7423735499382019, + "num_tokens": 118362457.0, + "step": 51210 + }, + { + "epoch": 0.4696066746126341, + "learning_rate": 0.00010608049876226279, + "loss": 0.8256, + "mean_token_accuracy": 0.7476546823978424, + "num_tokens": 118386486.0, + "step": 51220 + }, + { + "epoch": 0.4696983588521133, + "learning_rate": 0.00010606216191436693, + "loss": 0.8517, + "mean_token_accuracy": 0.7486424028873444, + "num_tokens": 118410419.0, + "step": 51230 + }, + { + "epoch": 0.46979004309159256, + "learning_rate": 0.00010604382506647108, + "loss": 0.829, + "mean_token_accuracy": 0.7476514160633088, + "num_tokens": 118433801.0, + "step": 51240 + }, + { + "epoch": 0.4698817273310718, + "learning_rate": 0.00010602548821857523, + "loss": 0.8316, + "mean_token_accuracy": 0.7491062879562378, + "num_tokens": 118456782.0, + "step": 51250 + }, + { + "epoch": 0.469973411570551, + "learning_rate": 0.00010600715137067938, + "loss": 0.8196, + "mean_token_accuracy": 0.7526462316513062, + "num_tokens": 118479643.0, + "step": 51260 + }, + { + "epoch": 0.47006509581003025, + "learning_rate": 0.00010598881452278353, + "loss": 0.8924, + "mean_token_accuracy": 0.7386376023292541, + "num_tokens": 118502213.0, + "step": 51270 + }, + { + "epoch": 0.4701567800495095, + "learning_rate": 0.0001059704776748877, + "loss": 0.799, + "mean_token_accuracy": 0.7570102334022522, + "num_tokens": 118525687.0, + "step": 51280 + }, + { + "epoch": 0.4702484642889887, + "learning_rate": 0.00010595214082699185, + "loss": 0.8706, + "mean_token_accuracy": 0.7403916001319886, + "num_tokens": 118549338.0, + "step": 51290 + }, + { + "epoch": 0.47034014852846795, + "learning_rate": 0.000105933803979096, + "loss": 0.8349, + "mean_token_accuracy": 0.7466923415660858, + "num_tokens": 118572386.0, + "step": 51300 + }, + { + "epoch": 0.4704318327679472, + "learning_rate": 0.00010591546713120015, + "loss": 0.7769, + "mean_token_accuracy": 0.7625176906585693, + "num_tokens": 118595336.0, + "step": 51310 + }, + { + "epoch": 0.47052351700742645, + "learning_rate": 0.0001058971302833043, + "loss": 0.8196, + "mean_token_accuracy": 0.7529705107212067, + "num_tokens": 118619430.0, + "step": 51320 + }, + { + "epoch": 0.47061520124690565, + "learning_rate": 0.00010587879343540846, + "loss": 0.8369, + "mean_token_accuracy": 0.7511988520622254, + "num_tokens": 118642805.0, + "step": 51330 + }, + { + "epoch": 0.4707068854863849, + "learning_rate": 0.0001058604565875126, + "loss": 0.8554, + "mean_token_accuracy": 0.7438337802886963, + "num_tokens": 118665617.0, + "step": 51340 + }, + { + "epoch": 0.47079856972586415, + "learning_rate": 0.00010584211973961678, + "loss": 0.851, + "mean_token_accuracy": 0.7440335154533386, + "num_tokens": 118688621.0, + "step": 51350 + }, + { + "epoch": 0.47089025396534334, + "learning_rate": 0.00010582378289172093, + "loss": 0.8638, + "mean_token_accuracy": 0.7429041504859925, + "num_tokens": 118711355.0, + "step": 51360 + }, + { + "epoch": 0.4709819382048226, + "learning_rate": 0.00010580544604382508, + "loss": 0.8499, + "mean_token_accuracy": 0.7501009702682495, + "num_tokens": 118733886.0, + "step": 51370 + }, + { + "epoch": 0.47107362244430184, + "learning_rate": 0.00010578710919592922, + "loss": 0.817, + "mean_token_accuracy": 0.7575704097747803, + "num_tokens": 118756994.0, + "step": 51380 + }, + { + "epoch": 0.47116530668378104, + "learning_rate": 0.00010576877234803337, + "loss": 0.8123, + "mean_token_accuracy": 0.7541246056556702, + "num_tokens": 118779958.0, + "step": 51390 + }, + { + "epoch": 0.4712569909232603, + "learning_rate": 0.00010575043550013752, + "loss": 0.8106, + "mean_token_accuracy": 0.7564858138561249, + "num_tokens": 118803401.0, + "step": 51400 + }, + { + "epoch": 0.47134867516273954, + "learning_rate": 0.0001057320986522417, + "loss": 0.8505, + "mean_token_accuracy": 0.7455509245395661, + "num_tokens": 118825733.0, + "step": 51410 + }, + { + "epoch": 0.47144035940221873, + "learning_rate": 0.00010571376180434585, + "loss": 0.855, + "mean_token_accuracy": 0.7454495429992676, + "num_tokens": 118848401.0, + "step": 51420 + }, + { + "epoch": 0.471532043641698, + "learning_rate": 0.00010569542495644999, + "loss": 0.8875, + "mean_token_accuracy": 0.738635241985321, + "num_tokens": 118871766.0, + "step": 51430 + }, + { + "epoch": 0.47162372788117723, + "learning_rate": 0.00010567708810855414, + "loss": 0.8149, + "mean_token_accuracy": 0.7502297759056091, + "num_tokens": 118895310.0, + "step": 51440 + }, + { + "epoch": 0.4717154121206565, + "learning_rate": 0.0001056587512606583, + "loss": 0.8037, + "mean_token_accuracy": 0.7565677106380463, + "num_tokens": 118918312.0, + "step": 51450 + }, + { + "epoch": 0.4718070963601357, + "learning_rate": 0.00010564041441276245, + "loss": 0.8372, + "mean_token_accuracy": 0.7516836285591125, + "num_tokens": 118940763.0, + "step": 51460 + }, + { + "epoch": 0.47189878059961493, + "learning_rate": 0.0001056220775648666, + "loss": 0.8483, + "mean_token_accuracy": 0.7425761103630066, + "num_tokens": 118963901.0, + "step": 51470 + }, + { + "epoch": 0.4719904648390942, + "learning_rate": 0.00010560374071697076, + "loss": 0.8102, + "mean_token_accuracy": 0.7571872532367706, + "num_tokens": 118987206.0, + "step": 51480 + }, + { + "epoch": 0.4720821490785734, + "learning_rate": 0.00010558540386907491, + "loss": 0.8586, + "mean_token_accuracy": 0.7401663601398468, + "num_tokens": 119010643.0, + "step": 51490 + }, + { + "epoch": 0.4721738333180526, + "learning_rate": 0.00010556706702117907, + "loss": 0.8282, + "mean_token_accuracy": 0.7522598505020142, + "num_tokens": 119034049.0, + "step": 51500 + }, + { + "epoch": 0.4722655175575319, + "learning_rate": 0.00010554873017328322, + "loss": 0.81, + "mean_token_accuracy": 0.7589615702629089, + "num_tokens": 119056837.0, + "step": 51510 + }, + { + "epoch": 0.4723572017970111, + "learning_rate": 0.00010553039332538737, + "loss": 0.8775, + "mean_token_accuracy": 0.7378575384616852, + "num_tokens": 119079421.0, + "step": 51520 + }, + { + "epoch": 0.4724488860364903, + "learning_rate": 0.00010551205647749152, + "loss": 0.8418, + "mean_token_accuracy": 0.7503543257713318, + "num_tokens": 119102716.0, + "step": 51530 + }, + { + "epoch": 0.4725405702759696, + "learning_rate": 0.00010549371962959566, + "loss": 0.8419, + "mean_token_accuracy": 0.7465055823326111, + "num_tokens": 119125546.0, + "step": 51540 + }, + { + "epoch": 0.47263225451544877, + "learning_rate": 0.00010547538278169984, + "loss": 0.8375, + "mean_token_accuracy": 0.7422538876533509, + "num_tokens": 119147921.0, + "step": 51550 + }, + { + "epoch": 0.472723938754928, + "learning_rate": 0.00010545704593380399, + "loss": 0.8145, + "mean_token_accuracy": 0.7520704388618469, + "num_tokens": 119171297.0, + "step": 51560 + }, + { + "epoch": 0.47281562299440727, + "learning_rate": 0.00010543870908590814, + "loss": 0.8284, + "mean_token_accuracy": 0.7501891314983368, + "num_tokens": 119194705.0, + "step": 51570 + }, + { + "epoch": 0.4729073072338865, + "learning_rate": 0.00010542037223801228, + "loss": 0.8495, + "mean_token_accuracy": 0.7503993451595307, + "num_tokens": 119218328.0, + "step": 51580 + }, + { + "epoch": 0.4729989914733657, + "learning_rate": 0.00010540203539011643, + "loss": 0.8372, + "mean_token_accuracy": 0.7520356714725495, + "num_tokens": 119241496.0, + "step": 51590 + }, + { + "epoch": 0.47309067571284497, + "learning_rate": 0.00010538369854222059, + "loss": 0.8557, + "mean_token_accuracy": 0.74845569729805, + "num_tokens": 119264681.0, + "step": 51600 + }, + { + "epoch": 0.4731823599523242, + "learning_rate": 0.00010536536169432476, + "loss": 0.788, + "mean_token_accuracy": 0.7576924562454224, + "num_tokens": 119288006.0, + "step": 51610 + }, + { + "epoch": 0.4732740441918034, + "learning_rate": 0.00010534702484642892, + "loss": 0.808, + "mean_token_accuracy": 0.7529437422752381, + "num_tokens": 119310643.0, + "step": 51620 + }, + { + "epoch": 0.47336572843128266, + "learning_rate": 0.00010532868799853305, + "loss": 0.8412, + "mean_token_accuracy": 0.7463583409786224, + "num_tokens": 119333862.0, + "step": 51630 + }, + { + "epoch": 0.4734574126707619, + "learning_rate": 0.0001053103511506372, + "loss": 0.8165, + "mean_token_accuracy": 0.7486286044120789, + "num_tokens": 119357247.0, + "step": 51640 + }, + { + "epoch": 0.4735490969102411, + "learning_rate": 0.00010529201430274136, + "loss": 0.8608, + "mean_token_accuracy": 0.7437616527080536, + "num_tokens": 119380397.0, + "step": 51650 + }, + { + "epoch": 0.47364078114972036, + "learning_rate": 0.00010527367745484551, + "loss": 0.8292, + "mean_token_accuracy": 0.752439022064209, + "num_tokens": 119403250.0, + "step": 51660 + }, + { + "epoch": 0.4737324653891996, + "learning_rate": 0.00010525534060694966, + "loss": 0.8784, + "mean_token_accuracy": 0.7407907843589783, + "num_tokens": 119426124.0, + "step": 51670 + }, + { + "epoch": 0.4738241496286788, + "learning_rate": 0.00010523700375905383, + "loss": 0.861, + "mean_token_accuracy": 0.7457657277584075, + "num_tokens": 119448976.0, + "step": 51680 + }, + { + "epoch": 0.47391583386815805, + "learning_rate": 0.00010521866691115798, + "loss": 0.8079, + "mean_token_accuracy": 0.7516883432865142, + "num_tokens": 119472277.0, + "step": 51690 + }, + { + "epoch": 0.4740075181076373, + "learning_rate": 0.00010520033006326213, + "loss": 0.8496, + "mean_token_accuracy": 0.7472087979316712, + "num_tokens": 119496364.0, + "step": 51700 + }, + { + "epoch": 0.47409920234711656, + "learning_rate": 0.00010518199321536628, + "loss": 0.7881, + "mean_token_accuracy": 0.761373096704483, + "num_tokens": 119519462.0, + "step": 51710 + }, + { + "epoch": 0.47419088658659575, + "learning_rate": 0.00010516365636747044, + "loss": 0.8396, + "mean_token_accuracy": 0.7540312886238099, + "num_tokens": 119543215.0, + "step": 51720 + }, + { + "epoch": 0.474282570826075, + "learning_rate": 0.00010514531951957459, + "loss": 0.8612, + "mean_token_accuracy": 0.7419944047927857, + "num_tokens": 119565829.0, + "step": 51730 + }, + { + "epoch": 0.47437425506555425, + "learning_rate": 0.00010512698267167875, + "loss": 0.8483, + "mean_token_accuracy": 0.7489297389984131, + "num_tokens": 119588959.0, + "step": 51740 + }, + { + "epoch": 0.47446593930503345, + "learning_rate": 0.0001051086458237829, + "loss": 0.8264, + "mean_token_accuracy": 0.7514209091663361, + "num_tokens": 119611914.0, + "step": 51750 + }, + { + "epoch": 0.4745576235445127, + "learning_rate": 0.00010509030897588706, + "loss": 0.8446, + "mean_token_accuracy": 0.745944368839264, + "num_tokens": 119635176.0, + "step": 51760 + }, + { + "epoch": 0.47464930778399195, + "learning_rate": 0.00010507197212799121, + "loss": 0.8602, + "mean_token_accuracy": 0.7430785715579986, + "num_tokens": 119657685.0, + "step": 51770 + }, + { + "epoch": 0.47474099202347114, + "learning_rate": 0.00010505363528009535, + "loss": 0.8348, + "mean_token_accuracy": 0.7516210675239563, + "num_tokens": 119680720.0, + "step": 51780 + }, + { + "epoch": 0.4748326762629504, + "learning_rate": 0.0001050352984321995, + "loss": 0.8301, + "mean_token_accuracy": 0.7496432542800904, + "num_tokens": 119703871.0, + "step": 51790 + }, + { + "epoch": 0.47492436050242964, + "learning_rate": 0.00010501696158430365, + "loss": 0.8379, + "mean_token_accuracy": 0.7499487519264221, + "num_tokens": 119726436.0, + "step": 51800 + }, + { + "epoch": 0.47501604474190884, + "learning_rate": 0.00010499862473640783, + "loss": 0.8547, + "mean_token_accuracy": 0.7385568976402282, + "num_tokens": 119749559.0, + "step": 51810 + }, + { + "epoch": 0.4751077289813881, + "learning_rate": 0.00010498028788851198, + "loss": 0.8496, + "mean_token_accuracy": 0.7408250153064728, + "num_tokens": 119772661.0, + "step": 51820 + }, + { + "epoch": 0.47519941322086734, + "learning_rate": 0.00010496195104061612, + "loss": 0.8455, + "mean_token_accuracy": 0.7459851145744324, + "num_tokens": 119795952.0, + "step": 51830 + }, + { + "epoch": 0.4752910974603466, + "learning_rate": 0.00010494361419272027, + "loss": 0.8395, + "mean_token_accuracy": 0.7483327984809875, + "num_tokens": 119819648.0, + "step": 51840 + }, + { + "epoch": 0.4753827816998258, + "learning_rate": 0.00010492527734482442, + "loss": 0.8633, + "mean_token_accuracy": 0.7430233657360077, + "num_tokens": 119843115.0, + "step": 51850 + }, + { + "epoch": 0.47547446593930504, + "learning_rate": 0.00010490694049692857, + "loss": 0.8822, + "mean_token_accuracy": 0.7394209146499634, + "num_tokens": 119866523.0, + "step": 51860 + }, + { + "epoch": 0.4755661501787843, + "learning_rate": 0.00010488860364903274, + "loss": 0.8444, + "mean_token_accuracy": 0.7485830128192902, + "num_tokens": 119890122.0, + "step": 51870 + }, + { + "epoch": 0.4756578344182635, + "learning_rate": 0.00010487026680113689, + "loss": 0.8181, + "mean_token_accuracy": 0.7529316782951355, + "num_tokens": 119913204.0, + "step": 51880 + }, + { + "epoch": 0.47574951865774273, + "learning_rate": 0.00010485192995324104, + "loss": 0.8844, + "mean_token_accuracy": 0.7386928558349609, + "num_tokens": 119937298.0, + "step": 51890 + }, + { + "epoch": 0.475841202897222, + "learning_rate": 0.0001048335931053452, + "loss": 0.8305, + "mean_token_accuracy": 0.7530156075954437, + "num_tokens": 119960987.0, + "step": 51900 + }, + { + "epoch": 0.4759328871367012, + "learning_rate": 0.00010481525625744935, + "loss": 0.8356, + "mean_token_accuracy": 0.7472600281238556, + "num_tokens": 119984511.0, + "step": 51910 + }, + { + "epoch": 0.4760245713761804, + "learning_rate": 0.0001047969194095535, + "loss": 0.8523, + "mean_token_accuracy": 0.7455800354480744, + "num_tokens": 120007621.0, + "step": 51920 + }, + { + "epoch": 0.4761162556156597, + "learning_rate": 0.00010477858256165765, + "loss": 0.8178, + "mean_token_accuracy": 0.7557486116886138, + "num_tokens": 120030561.0, + "step": 51930 + }, + { + "epoch": 0.47620793985513893, + "learning_rate": 0.00010476024571376182, + "loss": 0.86, + "mean_token_accuracy": 0.7437947511672973, + "num_tokens": 120053788.0, + "step": 51940 + }, + { + "epoch": 0.4762996240946181, + "learning_rate": 0.00010474190886586597, + "loss": 0.8248, + "mean_token_accuracy": 0.7512517213821411, + "num_tokens": 120077500.0, + "step": 51950 + }, + { + "epoch": 0.4763913083340974, + "learning_rate": 0.00010472357201797012, + "loss": 0.8552, + "mean_token_accuracy": 0.7436775326728821, + "num_tokens": 120100246.0, + "step": 51960 + }, + { + "epoch": 0.4764829925735766, + "learning_rate": 0.00010470523517007427, + "loss": 0.8117, + "mean_token_accuracy": 0.7532978773117065, + "num_tokens": 120123221.0, + "step": 51970 + }, + { + "epoch": 0.4765746768130558, + "learning_rate": 0.00010468689832217841, + "loss": 0.8155, + "mean_token_accuracy": 0.7556072354316712, + "num_tokens": 120145683.0, + "step": 51980 + }, + { + "epoch": 0.47666636105253507, + "learning_rate": 0.00010466856147428256, + "loss": 0.8219, + "mean_token_accuracy": 0.7522577106952667, + "num_tokens": 120169455.0, + "step": 51990 + }, + { + "epoch": 0.4767580452920143, + "learning_rate": 0.00010465022462638674, + "loss": 0.8117, + "mean_token_accuracy": 0.7569294095039367, + "num_tokens": 120192384.0, + "step": 52000 + }, + { + "epoch": 0.4768497295314935, + "learning_rate": 0.0001046318877784909, + "loss": 0.8605, + "mean_token_accuracy": 0.742826646566391, + "num_tokens": 120215179.0, + "step": 52010 + }, + { + "epoch": 0.47694141377097277, + "learning_rate": 0.00010461355093059505, + "loss": 0.8067, + "mean_token_accuracy": 0.7528352260589599, + "num_tokens": 120239227.0, + "step": 52020 + }, + { + "epoch": 0.477033098010452, + "learning_rate": 0.00010459521408269918, + "loss": 0.8394, + "mean_token_accuracy": 0.7538626313209533, + "num_tokens": 120261731.0, + "step": 52030 + }, + { + "epoch": 0.4771247822499312, + "learning_rate": 0.00010457687723480334, + "loss": 0.7721, + "mean_token_accuracy": 0.7627759158611298, + "num_tokens": 120285007.0, + "step": 52040 + }, + { + "epoch": 0.47721646648941046, + "learning_rate": 0.00010455854038690749, + "loss": 0.8051, + "mean_token_accuracy": 0.7523185551166535, + "num_tokens": 120308883.0, + "step": 52050 + }, + { + "epoch": 0.4773081507288897, + "learning_rate": 0.00010454020353901164, + "loss": 0.7912, + "mean_token_accuracy": 0.7587815761566162, + "num_tokens": 120332633.0, + "step": 52060 + }, + { + "epoch": 0.47739983496836896, + "learning_rate": 0.0001045218666911158, + "loss": 0.8111, + "mean_token_accuracy": 0.7487365424633026, + "num_tokens": 120355728.0, + "step": 52070 + }, + { + "epoch": 0.47749151920784816, + "learning_rate": 0.00010450352984321996, + "loss": 0.8223, + "mean_token_accuracy": 0.7584529757499695, + "num_tokens": 120378645.0, + "step": 52080 + }, + { + "epoch": 0.4775832034473274, + "learning_rate": 0.00010448519299532411, + "loss": 0.8527, + "mean_token_accuracy": 0.7448618650436402, + "num_tokens": 120401944.0, + "step": 52090 + }, + { + "epoch": 0.47767488768680666, + "learning_rate": 0.00010446685614742826, + "loss": 0.85, + "mean_token_accuracy": 0.7441773533821106, + "num_tokens": 120425306.0, + "step": 52100 + }, + { + "epoch": 0.47776657192628585, + "learning_rate": 0.00010444851929953241, + "loss": 0.8648, + "mean_token_accuracy": 0.7408665239810943, + "num_tokens": 120448261.0, + "step": 52110 + }, + { + "epoch": 0.4778582561657651, + "learning_rate": 0.00010443018245163656, + "loss": 0.8511, + "mean_token_accuracy": 0.7457766473293305, + "num_tokens": 120471511.0, + "step": 52120 + }, + { + "epoch": 0.47794994040524436, + "learning_rate": 0.00010441184560374073, + "loss": 0.8259, + "mean_token_accuracy": 0.7492813110351563, + "num_tokens": 120493351.0, + "step": 52130 + }, + { + "epoch": 0.47804162464472355, + "learning_rate": 0.00010439350875584488, + "loss": 0.8023, + "mean_token_accuracy": 0.7554517388343811, + "num_tokens": 120515568.0, + "step": 52140 + }, + { + "epoch": 0.4781333088842028, + "learning_rate": 0.00010437517190794903, + "loss": 0.8378, + "mean_token_accuracy": 0.7453085303306579, + "num_tokens": 120538742.0, + "step": 52150 + }, + { + "epoch": 0.47822499312368205, + "learning_rate": 0.00010435683506005318, + "loss": 0.8355, + "mean_token_accuracy": 0.7500856280326843, + "num_tokens": 120561821.0, + "step": 52160 + }, + { + "epoch": 0.47831667736316125, + "learning_rate": 0.00010433849821215734, + "loss": 0.8482, + "mean_token_accuracy": 0.7485159277915955, + "num_tokens": 120585029.0, + "step": 52170 + }, + { + "epoch": 0.4784083616026405, + "learning_rate": 0.00010432016136426148, + "loss": 0.8381, + "mean_token_accuracy": 0.747643381357193, + "num_tokens": 120607937.0, + "step": 52180 + }, + { + "epoch": 0.47850004584211975, + "learning_rate": 0.00010430182451636563, + "loss": 0.8316, + "mean_token_accuracy": 0.7510312020778656, + "num_tokens": 120629692.0, + "step": 52190 + }, + { + "epoch": 0.478591730081599, + "learning_rate": 0.0001042834876684698, + "loss": 0.7832, + "mean_token_accuracy": 0.7608694970607758, + "num_tokens": 120652411.0, + "step": 52200 + }, + { + "epoch": 0.4786834143210782, + "learning_rate": 0.00010426515082057396, + "loss": 0.8531, + "mean_token_accuracy": 0.7451915502548218, + "num_tokens": 120676303.0, + "step": 52210 + }, + { + "epoch": 0.47877509856055744, + "learning_rate": 0.00010424681397267811, + "loss": 0.8264, + "mean_token_accuracy": 0.7469135582447052, + "num_tokens": 120699746.0, + "step": 52220 + }, + { + "epoch": 0.4788667828000367, + "learning_rate": 0.00010422847712478225, + "loss": 0.811, + "mean_token_accuracy": 0.7460567653179169, + "num_tokens": 120722778.0, + "step": 52230 + }, + { + "epoch": 0.4789584670395159, + "learning_rate": 0.0001042101402768864, + "loss": 0.8275, + "mean_token_accuracy": 0.7463421106338501, + "num_tokens": 120746157.0, + "step": 52240 + }, + { + "epoch": 0.47905015127899514, + "learning_rate": 0.00010419180342899055, + "loss": 0.8263, + "mean_token_accuracy": 0.7499868214130402, + "num_tokens": 120769751.0, + "step": 52250 + }, + { + "epoch": 0.4791418355184744, + "learning_rate": 0.00010417346658109473, + "loss": 0.806, + "mean_token_accuracy": 0.7564871966838836, + "num_tokens": 120793248.0, + "step": 52260 + }, + { + "epoch": 0.4792335197579536, + "learning_rate": 0.00010415512973319887, + "loss": 0.8442, + "mean_token_accuracy": 0.7389548480510711, + "num_tokens": 120816385.0, + "step": 52270 + }, + { + "epoch": 0.47932520399743284, + "learning_rate": 0.00010413679288530302, + "loss": 0.8147, + "mean_token_accuracy": 0.7481178760528564, + "num_tokens": 120839881.0, + "step": 52280 + }, + { + "epoch": 0.4794168882369121, + "learning_rate": 0.00010411845603740717, + "loss": 0.8121, + "mean_token_accuracy": 0.7531205475330353, + "num_tokens": 120862336.0, + "step": 52290 + }, + { + "epoch": 0.4795085724763913, + "learning_rate": 0.00010410011918951132, + "loss": 0.8156, + "mean_token_accuracy": 0.7549703240394592, + "num_tokens": 120886121.0, + "step": 52300 + }, + { + "epoch": 0.47960025671587053, + "learning_rate": 0.00010408178234161548, + "loss": 0.815, + "mean_token_accuracy": 0.7477683067321778, + "num_tokens": 120908940.0, + "step": 52310 + }, + { + "epoch": 0.4796919409553498, + "learning_rate": 0.00010406344549371963, + "loss": 0.8472, + "mean_token_accuracy": 0.7484028577804566, + "num_tokens": 120932037.0, + "step": 52320 + }, + { + "epoch": 0.47978362519482903, + "learning_rate": 0.0001040451086458238, + "loss": 0.8617, + "mean_token_accuracy": 0.7395271182060241, + "num_tokens": 120954654.0, + "step": 52330 + }, + { + "epoch": 0.47987530943430823, + "learning_rate": 0.00010402677179792795, + "loss": 0.8259, + "mean_token_accuracy": 0.7498848557472229, + "num_tokens": 120978417.0, + "step": 52340 + }, + { + "epoch": 0.4799669936737875, + "learning_rate": 0.0001040084349500321, + "loss": 0.853, + "mean_token_accuracy": 0.7381206154823303, + "num_tokens": 121001792.0, + "step": 52350 + }, + { + "epoch": 0.48005867791326673, + "learning_rate": 0.00010399009810213625, + "loss": 0.7991, + "mean_token_accuracy": 0.7535934984683991, + "num_tokens": 121024543.0, + "step": 52360 + }, + { + "epoch": 0.4801503621527459, + "learning_rate": 0.0001039717612542404, + "loss": 0.833, + "mean_token_accuracy": 0.7542675793170929, + "num_tokens": 121048134.0, + "step": 52370 + }, + { + "epoch": 0.4802420463922252, + "learning_rate": 0.00010395342440634454, + "loss": 0.8424, + "mean_token_accuracy": 0.7429106175899506, + "num_tokens": 121071475.0, + "step": 52380 + }, + { + "epoch": 0.4803337306317044, + "learning_rate": 0.00010393508755844872, + "loss": 0.796, + "mean_token_accuracy": 0.7548368990421295, + "num_tokens": 121094800.0, + "step": 52390 + }, + { + "epoch": 0.4804254148711836, + "learning_rate": 0.00010391675071055287, + "loss": 0.8326, + "mean_token_accuracy": 0.7476666033267975, + "num_tokens": 121116980.0, + "step": 52400 + }, + { + "epoch": 0.48051709911066287, + "learning_rate": 0.00010389841386265702, + "loss": 0.861, + "mean_token_accuracy": 0.7479492425918579, + "num_tokens": 121139950.0, + "step": 52410 + }, + { + "epoch": 0.4806087833501421, + "learning_rate": 0.00010388007701476117, + "loss": 0.8385, + "mean_token_accuracy": 0.7493346989154815, + "num_tokens": 121163291.0, + "step": 52420 + }, + { + "epoch": 0.4807004675896213, + "learning_rate": 0.00010386174016686531, + "loss": 0.8544, + "mean_token_accuracy": 0.7546171486377716, + "num_tokens": 121185902.0, + "step": 52430 + }, + { + "epoch": 0.48079215182910057, + "learning_rate": 0.00010384340331896946, + "loss": 0.8602, + "mean_token_accuracy": 0.743706864118576, + "num_tokens": 121208699.0, + "step": 52440 + }, + { + "epoch": 0.4808838360685798, + "learning_rate": 0.00010382506647107362, + "loss": 0.8489, + "mean_token_accuracy": 0.7450501918792725, + "num_tokens": 121231698.0, + "step": 52450 + }, + { + "epoch": 0.48097552030805907, + "learning_rate": 0.0001038067296231778, + "loss": 0.853, + "mean_token_accuracy": 0.7432117164134979, + "num_tokens": 121256217.0, + "step": 52460 + }, + { + "epoch": 0.48106720454753826, + "learning_rate": 0.00010378839277528193, + "loss": 0.8337, + "mean_token_accuracy": 0.743570214509964, + "num_tokens": 121278164.0, + "step": 52470 + }, + { + "epoch": 0.4811588887870175, + "learning_rate": 0.00010377005592738609, + "loss": 0.8142, + "mean_token_accuracy": 0.7559535920619964, + "num_tokens": 121301395.0, + "step": 52480 + }, + { + "epoch": 0.48125057302649676, + "learning_rate": 0.00010375171907949024, + "loss": 0.8345, + "mean_token_accuracy": 0.751169091463089, + "num_tokens": 121324729.0, + "step": 52490 + }, + { + "epoch": 0.48134225726597596, + "learning_rate": 0.00010373338223159439, + "loss": 0.8318, + "mean_token_accuracy": 0.7524395287036896, + "num_tokens": 121347953.0, + "step": 52500 + }, + { + "epoch": 0.4814339415054552, + "learning_rate": 0.00010371504538369854, + "loss": 0.8396, + "mean_token_accuracy": 0.7450460493564606, + "num_tokens": 121371802.0, + "step": 52510 + }, + { + "epoch": 0.48152562574493446, + "learning_rate": 0.0001036967085358027, + "loss": 0.8391, + "mean_token_accuracy": 0.7463997006416321, + "num_tokens": 121394010.0, + "step": 52520 + }, + { + "epoch": 0.48161730998441366, + "learning_rate": 0.00010367837168790686, + "loss": 0.8553, + "mean_token_accuracy": 0.743210768699646, + "num_tokens": 121416354.0, + "step": 52530 + }, + { + "epoch": 0.4817089942238929, + "learning_rate": 0.00010366003484001101, + "loss": 0.855, + "mean_token_accuracy": 0.7479791879653931, + "num_tokens": 121439253.0, + "step": 52540 + }, + { + "epoch": 0.48180067846337216, + "learning_rate": 0.00010364169799211516, + "loss": 0.8827, + "mean_token_accuracy": 0.7378830492496491, + "num_tokens": 121462252.0, + "step": 52550 + }, + { + "epoch": 0.4818923627028514, + "learning_rate": 0.00010362336114421931, + "loss": 0.8453, + "mean_token_accuracy": 0.7453905045986176, + "num_tokens": 121484757.0, + "step": 52560 + }, + { + "epoch": 0.4819840469423306, + "learning_rate": 0.00010360502429632347, + "loss": 0.8349, + "mean_token_accuracy": 0.7503317594528198, + "num_tokens": 121508367.0, + "step": 52570 + }, + { + "epoch": 0.48207573118180985, + "learning_rate": 0.0001035866874484276, + "loss": 0.8188, + "mean_token_accuracy": 0.7495253026485443, + "num_tokens": 121531651.0, + "step": 52580 + }, + { + "epoch": 0.4821674154212891, + "learning_rate": 0.00010356835060053178, + "loss": 0.8608, + "mean_token_accuracy": 0.7381142377853394, + "num_tokens": 121554517.0, + "step": 52590 + }, + { + "epoch": 0.4822590996607683, + "learning_rate": 0.00010355001375263593, + "loss": 0.8246, + "mean_token_accuracy": 0.7543053805828095, + "num_tokens": 121576594.0, + "step": 52600 + }, + { + "epoch": 0.48235078390024755, + "learning_rate": 0.00010353167690474009, + "loss": 0.8567, + "mean_token_accuracy": 0.7421742618083954, + "num_tokens": 121599915.0, + "step": 52610 + }, + { + "epoch": 0.4824424681397268, + "learning_rate": 0.00010351334005684424, + "loss": 0.8347, + "mean_token_accuracy": 0.7479613125324249, + "num_tokens": 121623606.0, + "step": 52620 + }, + { + "epoch": 0.482534152379206, + "learning_rate": 0.00010349500320894838, + "loss": 0.8485, + "mean_token_accuracy": 0.7455990254878998, + "num_tokens": 121647035.0, + "step": 52630 + }, + { + "epoch": 0.48262583661868524, + "learning_rate": 0.00010347666636105253, + "loss": 0.8701, + "mean_token_accuracy": 0.7386673331260681, + "num_tokens": 121670147.0, + "step": 52640 + }, + { + "epoch": 0.4827175208581645, + "learning_rate": 0.00010345832951315671, + "loss": 0.8354, + "mean_token_accuracy": 0.7507193684577942, + "num_tokens": 121693605.0, + "step": 52650 + }, + { + "epoch": 0.4828092050976437, + "learning_rate": 0.00010343999266526086, + "loss": 0.8244, + "mean_token_accuracy": 0.7527222037315369, + "num_tokens": 121717183.0, + "step": 52660 + }, + { + "epoch": 0.48290088933712294, + "learning_rate": 0.000103421655817365, + "loss": 0.8295, + "mean_token_accuracy": 0.7455935955047608, + "num_tokens": 121739687.0, + "step": 52670 + }, + { + "epoch": 0.4829925735766022, + "learning_rate": 0.00010340331896946915, + "loss": 0.8202, + "mean_token_accuracy": 0.7583676457405091, + "num_tokens": 121761628.0, + "step": 52680 + }, + { + "epoch": 0.48308425781608144, + "learning_rate": 0.0001033849821215733, + "loss": 0.8408, + "mean_token_accuracy": 0.746461832523346, + "num_tokens": 121783805.0, + "step": 52690 + }, + { + "epoch": 0.48317594205556064, + "learning_rate": 0.00010336664527367745, + "loss": 0.8456, + "mean_token_accuracy": 0.7479347705841064, + "num_tokens": 121808213.0, + "step": 52700 + }, + { + "epoch": 0.4832676262950399, + "learning_rate": 0.0001033483084257816, + "loss": 0.8246, + "mean_token_accuracy": 0.7482814371585846, + "num_tokens": 121830679.0, + "step": 52710 + }, + { + "epoch": 0.48335931053451914, + "learning_rate": 0.00010332997157788577, + "loss": 0.8133, + "mean_token_accuracy": 0.752324515581131, + "num_tokens": 121853673.0, + "step": 52720 + }, + { + "epoch": 0.48345099477399833, + "learning_rate": 0.00010331163472998992, + "loss": 0.8391, + "mean_token_accuracy": 0.7527458786964416, + "num_tokens": 121877208.0, + "step": 52730 + }, + { + "epoch": 0.4835426790134776, + "learning_rate": 0.00010329329788209407, + "loss": 0.8248, + "mean_token_accuracy": 0.7487370789051055, + "num_tokens": 121900046.0, + "step": 52740 + }, + { + "epoch": 0.48363436325295683, + "learning_rate": 0.00010327496103419823, + "loss": 0.8196, + "mean_token_accuracy": 0.7506524980068207, + "num_tokens": 121923400.0, + "step": 52750 + }, + { + "epoch": 0.48372604749243603, + "learning_rate": 0.00010325662418630238, + "loss": 0.8323, + "mean_token_accuracy": 0.7495845139026642, + "num_tokens": 121946713.0, + "step": 52760 + }, + { + "epoch": 0.4838177317319153, + "learning_rate": 0.00010323828733840653, + "loss": 0.8181, + "mean_token_accuracy": 0.7542740881443024, + "num_tokens": 121970201.0, + "step": 52770 + }, + { + "epoch": 0.48390941597139453, + "learning_rate": 0.00010321995049051067, + "loss": 0.8181, + "mean_token_accuracy": 0.7539512097835541, + "num_tokens": 121992894.0, + "step": 52780 + }, + { + "epoch": 0.4840011002108737, + "learning_rate": 0.00010320161364261485, + "loss": 0.8546, + "mean_token_accuracy": 0.7451876163482666, + "num_tokens": 122015688.0, + "step": 52790 + }, + { + "epoch": 0.484092784450353, + "learning_rate": 0.000103183276794719, + "loss": 0.8287, + "mean_token_accuracy": 0.7509006202220917, + "num_tokens": 122038967.0, + "step": 52800 + }, + { + "epoch": 0.4841844686898322, + "learning_rate": 0.00010316493994682315, + "loss": 0.8595, + "mean_token_accuracy": 0.7380962252616883, + "num_tokens": 122061353.0, + "step": 52810 + }, + { + "epoch": 0.4842761529293115, + "learning_rate": 0.0001031466030989273, + "loss": 0.8237, + "mean_token_accuracy": 0.754196149110794, + "num_tokens": 122084477.0, + "step": 52820 + }, + { + "epoch": 0.48436783716879067, + "learning_rate": 0.00010312826625103144, + "loss": 0.8154, + "mean_token_accuracy": 0.753213620185852, + "num_tokens": 122107703.0, + "step": 52830 + }, + { + "epoch": 0.4844595214082699, + "learning_rate": 0.0001031099294031356, + "loss": 0.8276, + "mean_token_accuracy": 0.7469814538955688, + "num_tokens": 122131131.0, + "step": 52840 + }, + { + "epoch": 0.4845512056477492, + "learning_rate": 0.00010309159255523977, + "loss": 0.8162, + "mean_token_accuracy": 0.7541975140571594, + "num_tokens": 122153827.0, + "step": 52850 + }, + { + "epoch": 0.48464288988722837, + "learning_rate": 0.00010307325570734392, + "loss": 0.8775, + "mean_token_accuracy": 0.7420593559741974, + "num_tokens": 122176540.0, + "step": 52860 + }, + { + "epoch": 0.4847345741267076, + "learning_rate": 0.00010305491885944806, + "loss": 0.8406, + "mean_token_accuracy": 0.7503218650817871, + "num_tokens": 122200077.0, + "step": 52870 + }, + { + "epoch": 0.48482625836618687, + "learning_rate": 0.00010303658201155221, + "loss": 0.8824, + "mean_token_accuracy": 0.7431121945381165, + "num_tokens": 122222774.0, + "step": 52880 + }, + { + "epoch": 0.48491794260566606, + "learning_rate": 0.00010301824516365637, + "loss": 0.8375, + "mean_token_accuracy": 0.7453800857067108, + "num_tokens": 122245482.0, + "step": 52890 + }, + { + "epoch": 0.4850096268451453, + "learning_rate": 0.00010299990831576052, + "loss": 0.8432, + "mean_token_accuracy": 0.7508934795856476, + "num_tokens": 122268827.0, + "step": 52900 + }, + { + "epoch": 0.48510131108462456, + "learning_rate": 0.00010298157146786467, + "loss": 0.8268, + "mean_token_accuracy": 0.7549352049827576, + "num_tokens": 122292940.0, + "step": 52910 + }, + { + "epoch": 0.48519299532410376, + "learning_rate": 0.00010296323461996884, + "loss": 0.7945, + "mean_token_accuracy": 0.7612595319747925, + "num_tokens": 122315859.0, + "step": 52920 + }, + { + "epoch": 0.485284679563583, + "learning_rate": 0.00010294489777207299, + "loss": 0.8001, + "mean_token_accuracy": 0.7555343866348266, + "num_tokens": 122338418.0, + "step": 52930 + }, + { + "epoch": 0.48537636380306226, + "learning_rate": 0.00010292656092417714, + "loss": 0.818, + "mean_token_accuracy": 0.7511711657047272, + "num_tokens": 122362571.0, + "step": 52940 + }, + { + "epoch": 0.4854680480425415, + "learning_rate": 0.00010290822407628129, + "loss": 0.8462, + "mean_token_accuracy": 0.7403854608535767, + "num_tokens": 122386044.0, + "step": 52950 + }, + { + "epoch": 0.4855597322820207, + "learning_rate": 0.00010288988722838544, + "loss": 0.8326, + "mean_token_accuracy": 0.7513818204402923, + "num_tokens": 122409734.0, + "step": 52960 + }, + { + "epoch": 0.48565141652149996, + "learning_rate": 0.0001028715503804896, + "loss": 0.8305, + "mean_token_accuracy": 0.748537564277649, + "num_tokens": 122432414.0, + "step": 52970 + }, + { + "epoch": 0.4857431007609792, + "learning_rate": 0.00010285321353259376, + "loss": 0.8434, + "mean_token_accuracy": 0.7477980315685272, + "num_tokens": 122455862.0, + "step": 52980 + }, + { + "epoch": 0.4858347850004584, + "learning_rate": 0.00010283487668469791, + "loss": 0.8376, + "mean_token_accuracy": 0.7481094300746918, + "num_tokens": 122478776.0, + "step": 52990 + }, + { + "epoch": 0.48592646923993765, + "learning_rate": 0.00010281653983680206, + "loss": 0.7979, + "mean_token_accuracy": 0.7605419218540191, + "num_tokens": 122502337.0, + "step": 53000 + }, + { + "epoch": 0.4860181534794169, + "learning_rate": 0.00010279820298890622, + "loss": 0.8217, + "mean_token_accuracy": 0.7488216757774353, + "num_tokens": 122527045.0, + "step": 53010 + }, + { + "epoch": 0.4861098377188961, + "learning_rate": 0.00010277986614101037, + "loss": 0.8262, + "mean_token_accuracy": 0.7520414590835571, + "num_tokens": 122550180.0, + "step": 53020 + }, + { + "epoch": 0.48620152195837535, + "learning_rate": 0.0001027615292931145, + "loss": 0.8614, + "mean_token_accuracy": 0.7416727066040039, + "num_tokens": 122573166.0, + "step": 53030 + }, + { + "epoch": 0.4862932061978546, + "learning_rate": 0.00010274319244521866, + "loss": 0.838, + "mean_token_accuracy": 0.7475881159305573, + "num_tokens": 122597039.0, + "step": 53040 + }, + { + "epoch": 0.48638489043733385, + "learning_rate": 0.00010272485559732284, + "loss": 0.8538, + "mean_token_accuracy": 0.7462023854255676, + "num_tokens": 122620075.0, + "step": 53050 + }, + { + "epoch": 0.48647657467681304, + "learning_rate": 0.00010270651874942699, + "loss": 0.8641, + "mean_token_accuracy": 0.7412254214286804, + "num_tokens": 122643227.0, + "step": 53060 + }, + { + "epoch": 0.4865682589162923, + "learning_rate": 0.00010268818190153113, + "loss": 0.8427, + "mean_token_accuracy": 0.7480344295501709, + "num_tokens": 122666324.0, + "step": 53070 + }, + { + "epoch": 0.48665994315577155, + "learning_rate": 0.00010266984505363528, + "loss": 0.8588, + "mean_token_accuracy": 0.7418996036052704, + "num_tokens": 122690440.0, + "step": 53080 + }, + { + "epoch": 0.48675162739525074, + "learning_rate": 0.00010265150820573943, + "loss": 0.8128, + "mean_token_accuracy": 0.7535100996494293, + "num_tokens": 122714101.0, + "step": 53090 + }, + { + "epoch": 0.48684331163473, + "learning_rate": 0.00010263317135784358, + "loss": 0.8647, + "mean_token_accuracy": 0.7431944847106934, + "num_tokens": 122737056.0, + "step": 53100 + }, + { + "epoch": 0.48693499587420924, + "learning_rate": 0.00010261483450994776, + "loss": 0.8615, + "mean_token_accuracy": 0.7404684543609619, + "num_tokens": 122759933.0, + "step": 53110 + }, + { + "epoch": 0.48702668011368844, + "learning_rate": 0.0001025964976620519, + "loss": 0.8289, + "mean_token_accuracy": 0.7526221632957458, + "num_tokens": 122783701.0, + "step": 53120 + }, + { + "epoch": 0.4871183643531677, + "learning_rate": 0.00010257816081415605, + "loss": 0.8472, + "mean_token_accuracy": 0.7498015403747559, + "num_tokens": 122806347.0, + "step": 53130 + }, + { + "epoch": 0.48721004859264694, + "learning_rate": 0.0001025598239662602, + "loss": 0.837, + "mean_token_accuracy": 0.7467487394809723, + "num_tokens": 122829849.0, + "step": 53140 + }, + { + "epoch": 0.48730173283212613, + "learning_rate": 0.00010254148711836436, + "loss": 0.8365, + "mean_token_accuracy": 0.7487476229667663, + "num_tokens": 122852790.0, + "step": 53150 + }, + { + "epoch": 0.4873934170716054, + "learning_rate": 0.00010252315027046851, + "loss": 0.8493, + "mean_token_accuracy": 0.7416711390018463, + "num_tokens": 122876160.0, + "step": 53160 + }, + { + "epoch": 0.48748510131108463, + "learning_rate": 0.00010250481342257266, + "loss": 0.8168, + "mean_token_accuracy": 0.7511836946010589, + "num_tokens": 122899198.0, + "step": 53170 + }, + { + "epoch": 0.4875767855505639, + "learning_rate": 0.00010248647657467682, + "loss": 0.8041, + "mean_token_accuracy": 0.7555497586727142, + "num_tokens": 122922624.0, + "step": 53180 + }, + { + "epoch": 0.4876684697900431, + "learning_rate": 0.00010246813972678098, + "loss": 0.8351, + "mean_token_accuracy": 0.7509292483329773, + "num_tokens": 122945964.0, + "step": 53190 + }, + { + "epoch": 0.48776015402952233, + "learning_rate": 0.00010244980287888513, + "loss": 0.8352, + "mean_token_accuracy": 0.7502477407455445, + "num_tokens": 122968305.0, + "step": 53200 + }, + { + "epoch": 0.4878518382690016, + "learning_rate": 0.00010243146603098928, + "loss": 0.8207, + "mean_token_accuracy": 0.7479778409004212, + "num_tokens": 122991402.0, + "step": 53210 + }, + { + "epoch": 0.4879435225084808, + "learning_rate": 0.00010241312918309343, + "loss": 0.8344, + "mean_token_accuracy": 0.7482169210910797, + "num_tokens": 123013809.0, + "step": 53220 + }, + { + "epoch": 0.48803520674796, + "learning_rate": 0.00010239479233519757, + "loss": 0.8012, + "mean_token_accuracy": 0.7504085719585418, + "num_tokens": 123037355.0, + "step": 53230 + }, + { + "epoch": 0.4881268909874393, + "learning_rate": 0.00010237645548730175, + "loss": 0.8286, + "mean_token_accuracy": 0.754689735174179, + "num_tokens": 123060883.0, + "step": 53240 + }, + { + "epoch": 0.48821857522691847, + "learning_rate": 0.0001023581186394059, + "loss": 0.8821, + "mean_token_accuracy": 0.7471439480781555, + "num_tokens": 123083718.0, + "step": 53250 + }, + { + "epoch": 0.4883102594663977, + "learning_rate": 0.00010233978179151005, + "loss": 0.8211, + "mean_token_accuracy": 0.7488535463809967, + "num_tokens": 123108286.0, + "step": 53260 + }, + { + "epoch": 0.488401943705877, + "learning_rate": 0.00010232144494361419, + "loss": 0.8447, + "mean_token_accuracy": 0.7493493914604187, + "num_tokens": 123130644.0, + "step": 53270 + }, + { + "epoch": 0.48849362794535617, + "learning_rate": 0.00010230310809571834, + "loss": 0.8265, + "mean_token_accuracy": 0.7495214402675628, + "num_tokens": 123153605.0, + "step": 53280 + }, + { + "epoch": 0.4885853121848354, + "learning_rate": 0.0001022847712478225, + "loss": 0.852, + "mean_token_accuracy": 0.7408915996551514, + "num_tokens": 123176943.0, + "step": 53290 + }, + { + "epoch": 0.48867699642431467, + "learning_rate": 0.00010226643439992665, + "loss": 0.8617, + "mean_token_accuracy": 0.7433248281478881, + "num_tokens": 123200250.0, + "step": 53300 + }, + { + "epoch": 0.4887686806637939, + "learning_rate": 0.00010224809755203083, + "loss": 0.8116, + "mean_token_accuracy": 0.7507937252521515, + "num_tokens": 123223883.0, + "step": 53310 + }, + { + "epoch": 0.4888603649032731, + "learning_rate": 0.00010222976070413496, + "loss": 0.7952, + "mean_token_accuracy": 0.7581035494804382, + "num_tokens": 123246988.0, + "step": 53320 + }, + { + "epoch": 0.48895204914275237, + "learning_rate": 0.00010221142385623912, + "loss": 0.8105, + "mean_token_accuracy": 0.7543392360210419, + "num_tokens": 123269938.0, + "step": 53330 + }, + { + "epoch": 0.4890437333822316, + "learning_rate": 0.00010219308700834327, + "loss": 0.8474, + "mean_token_accuracy": 0.7448423445224762, + "num_tokens": 123292687.0, + "step": 53340 + }, + { + "epoch": 0.4891354176217108, + "learning_rate": 0.00010217475016044742, + "loss": 0.8544, + "mean_token_accuracy": 0.7385833621025085, + "num_tokens": 123315907.0, + "step": 53350 + }, + { + "epoch": 0.48922710186119006, + "learning_rate": 0.00010215641331255157, + "loss": 0.8205, + "mean_token_accuracy": 0.7468352377414703, + "num_tokens": 123339611.0, + "step": 53360 + }, + { + "epoch": 0.4893187861006693, + "learning_rate": 0.00010213807646465574, + "loss": 0.8317, + "mean_token_accuracy": 0.7495156407356263, + "num_tokens": 123362280.0, + "step": 53370 + }, + { + "epoch": 0.4894104703401485, + "learning_rate": 0.00010211973961675989, + "loss": 0.8107, + "mean_token_accuracy": 0.7533836543560029, + "num_tokens": 123385607.0, + "step": 53380 + }, + { + "epoch": 0.48950215457962776, + "learning_rate": 0.00010210140276886404, + "loss": 0.874, + "mean_token_accuracy": 0.7377766191959381, + "num_tokens": 123408402.0, + "step": 53390 + }, + { + "epoch": 0.489593838819107, + "learning_rate": 0.00010208306592096819, + "loss": 0.8772, + "mean_token_accuracy": 0.7404467165470123, + "num_tokens": 123430836.0, + "step": 53400 + }, + { + "epoch": 0.4896855230585862, + "learning_rate": 0.00010206472907307234, + "loss": 0.8328, + "mean_token_accuracy": 0.7528629839420319, + "num_tokens": 123454242.0, + "step": 53410 + }, + { + "epoch": 0.48977720729806545, + "learning_rate": 0.0001020463922251765, + "loss": 0.8507, + "mean_token_accuracy": 0.745625376701355, + "num_tokens": 123476968.0, + "step": 53420 + }, + { + "epoch": 0.4898688915375447, + "learning_rate": 0.00010202805537728063, + "loss": 0.8218, + "mean_token_accuracy": 0.7525958836078643, + "num_tokens": 123500200.0, + "step": 53430 + }, + { + "epoch": 0.48996057577702395, + "learning_rate": 0.00010200971852938481, + "loss": 0.8293, + "mean_token_accuracy": 0.7544655859470367, + "num_tokens": 123522379.0, + "step": 53440 + }, + { + "epoch": 0.49005226001650315, + "learning_rate": 0.00010199138168148897, + "loss": 0.8846, + "mean_token_accuracy": 0.7418582677841187, + "num_tokens": 123545390.0, + "step": 53450 + }, + { + "epoch": 0.4901439442559824, + "learning_rate": 0.00010197304483359312, + "loss": 0.8351, + "mean_token_accuracy": 0.7502604067325592, + "num_tokens": 123568907.0, + "step": 53460 + }, + { + "epoch": 0.49023562849546165, + "learning_rate": 0.00010195470798569726, + "loss": 0.8351, + "mean_token_accuracy": 0.7447330892086029, + "num_tokens": 123591722.0, + "step": 53470 + }, + { + "epoch": 0.49032731273494085, + "learning_rate": 0.00010193637113780141, + "loss": 0.8554, + "mean_token_accuracy": 0.7416792869567871, + "num_tokens": 123615097.0, + "step": 53480 + }, + { + "epoch": 0.4904189969744201, + "learning_rate": 0.00010191803428990556, + "loss": 0.8703, + "mean_token_accuracy": 0.7404252707958221, + "num_tokens": 123638149.0, + "step": 53490 + }, + { + "epoch": 0.49051068121389935, + "learning_rate": 0.00010189969744200974, + "loss": 0.8523, + "mean_token_accuracy": 0.7452394545078278, + "num_tokens": 123661313.0, + "step": 53500 + }, + { + "epoch": 0.49060236545337854, + "learning_rate": 0.00010188136059411389, + "loss": 0.8757, + "mean_token_accuracy": 0.7413649797439575, + "num_tokens": 123683722.0, + "step": 53510 + }, + { + "epoch": 0.4906940496928578, + "learning_rate": 0.00010186302374621803, + "loss": 0.8553, + "mean_token_accuracy": 0.7450942695140839, + "num_tokens": 123706555.0, + "step": 53520 + }, + { + "epoch": 0.49078573393233704, + "learning_rate": 0.00010184468689832218, + "loss": 0.8547, + "mean_token_accuracy": 0.7429875314235688, + "num_tokens": 123729654.0, + "step": 53530 + }, + { + "epoch": 0.49087741817181624, + "learning_rate": 0.00010182635005042633, + "loss": 0.8255, + "mean_token_accuracy": 0.7533956587314605, + "num_tokens": 123752547.0, + "step": 53540 + }, + { + "epoch": 0.4909691024112955, + "learning_rate": 0.00010180801320253048, + "loss": 0.8521, + "mean_token_accuracy": 0.7497077524662018, + "num_tokens": 123775174.0, + "step": 53550 + }, + { + "epoch": 0.49106078665077474, + "learning_rate": 0.00010178967635463464, + "loss": 0.8499, + "mean_token_accuracy": 0.748982959985733, + "num_tokens": 123798753.0, + "step": 53560 + }, + { + "epoch": 0.491152470890254, + "learning_rate": 0.0001017713395067388, + "loss": 0.8261, + "mean_token_accuracy": 0.7488219320774079, + "num_tokens": 123821854.0, + "step": 53570 + }, + { + "epoch": 0.4912441551297332, + "learning_rate": 0.00010175300265884295, + "loss": 0.8274, + "mean_token_accuracy": 0.7435190796852111, + "num_tokens": 123845987.0, + "step": 53580 + }, + { + "epoch": 0.49133583936921243, + "learning_rate": 0.0001017346658109471, + "loss": 0.8145, + "mean_token_accuracy": 0.7536229133605957, + "num_tokens": 123869171.0, + "step": 53590 + }, + { + "epoch": 0.4914275236086917, + "learning_rate": 0.00010171632896305126, + "loss": 0.8453, + "mean_token_accuracy": 0.7433777451515198, + "num_tokens": 123891472.0, + "step": 53600 + }, + { + "epoch": 0.4915192078481709, + "learning_rate": 0.00010169799211515541, + "loss": 0.8101, + "mean_token_accuracy": 0.7552849471569061, + "num_tokens": 123914707.0, + "step": 53610 + }, + { + "epoch": 0.49161089208765013, + "learning_rate": 0.00010167965526725956, + "loss": 0.8462, + "mean_token_accuracy": 0.7565894305706025, + "num_tokens": 123938036.0, + "step": 53620 + }, + { + "epoch": 0.4917025763271294, + "learning_rate": 0.00010166131841936373, + "loss": 0.8168, + "mean_token_accuracy": 0.7446473956108093, + "num_tokens": 123960850.0, + "step": 53630 + }, + { + "epoch": 0.4917942605666086, + "learning_rate": 0.00010164298157146788, + "loss": 0.9007, + "mean_token_accuracy": 0.7369200766086579, + "num_tokens": 123983908.0, + "step": 53640 + }, + { + "epoch": 0.4918859448060878, + "learning_rate": 0.00010162464472357203, + "loss": 0.8374, + "mean_token_accuracy": 0.7470629513263702, + "num_tokens": 124006825.0, + "step": 53650 + }, + { + "epoch": 0.4919776290455671, + "learning_rate": 0.00010160630787567618, + "loss": 0.8299, + "mean_token_accuracy": 0.7514701068401337, + "num_tokens": 124030247.0, + "step": 53660 + }, + { + "epoch": 0.49206931328504633, + "learning_rate": 0.00010158797102778032, + "loss": 0.813, + "mean_token_accuracy": 0.7538914799690246, + "num_tokens": 124053670.0, + "step": 53670 + }, + { + "epoch": 0.4921609975245255, + "learning_rate": 0.00010156963417988447, + "loss": 0.8503, + "mean_token_accuracy": 0.7473560988903045, + "num_tokens": 124077408.0, + "step": 53680 + }, + { + "epoch": 0.4922526817640048, + "learning_rate": 0.00010155129733198862, + "loss": 0.864, + "mean_token_accuracy": 0.7408625245094299, + "num_tokens": 124100296.0, + "step": 53690 + }, + { + "epoch": 0.492344366003484, + "learning_rate": 0.0001015329604840928, + "loss": 0.8428, + "mean_token_accuracy": 0.7433066725730896, + "num_tokens": 124124254.0, + "step": 53700 + }, + { + "epoch": 0.4924360502429632, + "learning_rate": 0.00010151462363619695, + "loss": 0.8383, + "mean_token_accuracy": 0.752090334892273, + "num_tokens": 124147370.0, + "step": 53710 + }, + { + "epoch": 0.49252773448244247, + "learning_rate": 0.00010149628678830109, + "loss": 0.8395, + "mean_token_accuracy": 0.7413933634757995, + "num_tokens": 124170302.0, + "step": 53720 + }, + { + "epoch": 0.4926194187219217, + "learning_rate": 0.00010147794994040525, + "loss": 0.8595, + "mean_token_accuracy": 0.7450426995754242, + "num_tokens": 124192812.0, + "step": 53730 + }, + { + "epoch": 0.4927111029614009, + "learning_rate": 0.0001014596130925094, + "loss": 0.8206, + "mean_token_accuracy": 0.7579657852649688, + "num_tokens": 124216287.0, + "step": 53740 + }, + { + "epoch": 0.49280278720088017, + "learning_rate": 0.00010144127624461355, + "loss": 0.8173, + "mean_token_accuracy": 0.7462433695793151, + "num_tokens": 124240432.0, + "step": 53750 + }, + { + "epoch": 0.4928944714403594, + "learning_rate": 0.00010142293939671771, + "loss": 0.8427, + "mean_token_accuracy": 0.7429296374320984, + "num_tokens": 124263116.0, + "step": 53760 + }, + { + "epoch": 0.4929861556798386, + "learning_rate": 0.00010140460254882187, + "loss": 0.8656, + "mean_token_accuracy": 0.7424785375595093, + "num_tokens": 124285638.0, + "step": 53770 + }, + { + "epoch": 0.49307783991931786, + "learning_rate": 0.00010138626570092602, + "loss": 0.8563, + "mean_token_accuracy": 0.7357562601566314, + "num_tokens": 124308847.0, + "step": 53780 + }, + { + "epoch": 0.4931695241587971, + "learning_rate": 0.00010136792885303017, + "loss": 0.8332, + "mean_token_accuracy": 0.7508998870849609, + "num_tokens": 124331689.0, + "step": 53790 + }, + { + "epoch": 0.49326120839827636, + "learning_rate": 0.00010134959200513432, + "loss": 0.8947, + "mean_token_accuracy": 0.7394472539424897, + "num_tokens": 124354817.0, + "step": 53800 + }, + { + "epoch": 0.49335289263775556, + "learning_rate": 0.00010133125515723847, + "loss": 0.8218, + "mean_token_accuracy": 0.7496876776218414, + "num_tokens": 124379230.0, + "step": 53810 + }, + { + "epoch": 0.4934445768772348, + "learning_rate": 0.00010131291830934263, + "loss": 0.8401, + "mean_token_accuracy": 0.7517239868640899, + "num_tokens": 124401885.0, + "step": 53820 + }, + { + "epoch": 0.49353626111671406, + "learning_rate": 0.00010129458146144679, + "loss": 0.9133, + "mean_token_accuracy": 0.7294662594795227, + "num_tokens": 124424534.0, + "step": 53830 + }, + { + "epoch": 0.49362794535619325, + "learning_rate": 0.00010127624461355094, + "loss": 0.8519, + "mean_token_accuracy": 0.7492198050022125, + "num_tokens": 124448015.0, + "step": 53840 + }, + { + "epoch": 0.4937196295956725, + "learning_rate": 0.0001012579077656551, + "loss": 0.8727, + "mean_token_accuracy": 0.7425671398639679, + "num_tokens": 124470790.0, + "step": 53850 + }, + { + "epoch": 0.49381131383515176, + "learning_rate": 0.00010123957091775925, + "loss": 0.8732, + "mean_token_accuracy": 0.7382482171058655, + "num_tokens": 124493253.0, + "step": 53860 + }, + { + "epoch": 0.49390299807463095, + "learning_rate": 0.00010122123406986338, + "loss": 0.845, + "mean_token_accuracy": 0.7456029891967774, + "num_tokens": 124516663.0, + "step": 53870 + }, + { + "epoch": 0.4939946823141102, + "learning_rate": 0.00010120289722196754, + "loss": 0.8595, + "mean_token_accuracy": 0.7506387591361999, + "num_tokens": 124539985.0, + "step": 53880 + }, + { + "epoch": 0.49408636655358945, + "learning_rate": 0.00010118456037407172, + "loss": 0.8231, + "mean_token_accuracy": 0.7518276274204254, + "num_tokens": 124562657.0, + "step": 53890 + }, + { + "epoch": 0.49417805079306865, + "learning_rate": 0.00010116622352617587, + "loss": 0.8218, + "mean_token_accuracy": 0.7578824937343598, + "num_tokens": 124586201.0, + "step": 53900 + }, + { + "epoch": 0.4942697350325479, + "learning_rate": 0.00010114788667828002, + "loss": 0.8031, + "mean_token_accuracy": 0.7554262220859528, + "num_tokens": 124610078.0, + "step": 53910 + }, + { + "epoch": 0.49436141927202715, + "learning_rate": 0.00010112954983038416, + "loss": 0.8343, + "mean_token_accuracy": 0.7464954614639282, + "num_tokens": 124633249.0, + "step": 53920 + }, + { + "epoch": 0.4944531035115064, + "learning_rate": 0.00010111121298248831, + "loss": 0.8002, + "mean_token_accuracy": 0.7635982513427735, + "num_tokens": 124656943.0, + "step": 53930 + }, + { + "epoch": 0.4945447877509856, + "learning_rate": 0.00010109287613459246, + "loss": 0.8482, + "mean_token_accuracy": 0.7445980846881867, + "num_tokens": 124680625.0, + "step": 53940 + }, + { + "epoch": 0.49463647199046484, + "learning_rate": 0.00010107453928669661, + "loss": 0.815, + "mean_token_accuracy": 0.7551271378993988, + "num_tokens": 124703669.0, + "step": 53950 + }, + { + "epoch": 0.4947281562299441, + "learning_rate": 0.00010105620243880078, + "loss": 0.8597, + "mean_token_accuracy": 0.7429558396339416, + "num_tokens": 124726885.0, + "step": 53960 + }, + { + "epoch": 0.4948198404694233, + "learning_rate": 0.00010103786559090493, + "loss": 0.8625, + "mean_token_accuracy": 0.7451183259487152, + "num_tokens": 124750499.0, + "step": 53970 + }, + { + "epoch": 0.49491152470890254, + "learning_rate": 0.00010101952874300908, + "loss": 0.8971, + "mean_token_accuracy": 0.7334162175655365, + "num_tokens": 124773676.0, + "step": 53980 + }, + { + "epoch": 0.4950032089483818, + "learning_rate": 0.00010100119189511323, + "loss": 0.8321, + "mean_token_accuracy": 0.7451906800270081, + "num_tokens": 124796337.0, + "step": 53990 + }, + { + "epoch": 0.495094893187861, + "learning_rate": 0.00010098285504721739, + "loss": 0.7969, + "mean_token_accuracy": 0.7585631549358368, + "num_tokens": 124819339.0, + "step": 54000 + }, + { + "epoch": 0.49518657742734024, + "learning_rate": 0.00010096451819932154, + "loss": 0.827, + "mean_token_accuracy": 0.7474742352962493, + "num_tokens": 124842774.0, + "step": 54010 + }, + { + "epoch": 0.4952782616668195, + "learning_rate": 0.00010094618135142569, + "loss": 0.8344, + "mean_token_accuracy": 0.7424811363220215, + "num_tokens": 124866459.0, + "step": 54020 + }, + { + "epoch": 0.4953699459062987, + "learning_rate": 0.00010092784450352986, + "loss": 0.8353, + "mean_token_accuracy": 0.7505001127719879, + "num_tokens": 124889371.0, + "step": 54030 + }, + { + "epoch": 0.49546163014577793, + "learning_rate": 0.00010090950765563401, + "loss": 0.8579, + "mean_token_accuracy": 0.7487920939922332, + "num_tokens": 124913372.0, + "step": 54040 + }, + { + "epoch": 0.4955533143852572, + "learning_rate": 0.00010089117080773816, + "loss": 0.8328, + "mean_token_accuracy": 0.7490865528583527, + "num_tokens": 124936404.0, + "step": 54050 + }, + { + "epoch": 0.49564499862473643, + "learning_rate": 0.00010087283395984231, + "loss": 0.8405, + "mean_token_accuracy": 0.7462813854217529, + "num_tokens": 124960577.0, + "step": 54060 + }, + { + "epoch": 0.4957366828642156, + "learning_rate": 0.00010085449711194645, + "loss": 0.8397, + "mean_token_accuracy": 0.7449421465396882, + "num_tokens": 124983439.0, + "step": 54070 + }, + { + "epoch": 0.4958283671036949, + "learning_rate": 0.0001008361602640506, + "loss": 0.8138, + "mean_token_accuracy": 0.7517531335353851, + "num_tokens": 125006546.0, + "step": 54080 + }, + { + "epoch": 0.49592005134317413, + "learning_rate": 0.00010081782341615478, + "loss": 0.839, + "mean_token_accuracy": 0.7510481238365173, + "num_tokens": 125029454.0, + "step": 54090 + }, + { + "epoch": 0.4960117355826533, + "learning_rate": 0.00010079948656825893, + "loss": 0.8402, + "mean_token_accuracy": 0.7541648924350739, + "num_tokens": 125051516.0, + "step": 54100 + }, + { + "epoch": 0.4961034198221326, + "learning_rate": 0.00010078114972036308, + "loss": 0.8322, + "mean_token_accuracy": 0.748639988899231, + "num_tokens": 125074623.0, + "step": 54110 + }, + { + "epoch": 0.4961951040616118, + "learning_rate": 0.00010076281287246722, + "loss": 0.8382, + "mean_token_accuracy": 0.751268619298935, + "num_tokens": 125097413.0, + "step": 54120 + }, + { + "epoch": 0.496286788301091, + "learning_rate": 0.00010074447602457137, + "loss": 0.8972, + "mean_token_accuracy": 0.7367906272411346, + "num_tokens": 125120365.0, + "step": 54130 + }, + { + "epoch": 0.49637847254057027, + "learning_rate": 0.00010072613917667553, + "loss": 0.8189, + "mean_token_accuracy": 0.7522039532661438, + "num_tokens": 125143300.0, + "step": 54140 + }, + { + "epoch": 0.4964701567800495, + "learning_rate": 0.00010070780232877968, + "loss": 0.837, + "mean_token_accuracy": 0.7452004492282868, + "num_tokens": 125165646.0, + "step": 54150 + }, + { + "epoch": 0.4965618410195287, + "learning_rate": 0.00010068946548088384, + "loss": 0.8293, + "mean_token_accuracy": 0.7507408201694489, + "num_tokens": 125187671.0, + "step": 54160 + }, + { + "epoch": 0.49665352525900797, + "learning_rate": 0.000100671128632988, + "loss": 0.8436, + "mean_token_accuracy": 0.7435282468795776, + "num_tokens": 125209892.0, + "step": 54170 + }, + { + "epoch": 0.4967452094984872, + "learning_rate": 0.00010065279178509215, + "loss": 0.8135, + "mean_token_accuracy": 0.754814600944519, + "num_tokens": 125232710.0, + "step": 54180 + }, + { + "epoch": 0.49683689373796647, + "learning_rate": 0.0001006344549371963, + "loss": 0.8446, + "mean_token_accuracy": 0.7491725504398346, + "num_tokens": 125255023.0, + "step": 54190 + }, + { + "epoch": 0.49692857797744566, + "learning_rate": 0.00010061611808930045, + "loss": 0.8191, + "mean_token_accuracy": 0.7464327573776245, + "num_tokens": 125278048.0, + "step": 54200 + }, + { + "epoch": 0.4970202622169249, + "learning_rate": 0.0001005977812414046, + "loss": 0.8353, + "mean_token_accuracy": 0.7493406713008881, + "num_tokens": 125302133.0, + "step": 54210 + }, + { + "epoch": 0.49711194645640416, + "learning_rate": 0.00010057944439350877, + "loss": 0.8163, + "mean_token_accuracy": 0.7528886139392853, + "num_tokens": 125325039.0, + "step": 54220 + }, + { + "epoch": 0.49720363069588336, + "learning_rate": 0.00010056110754561292, + "loss": 0.7919, + "mean_token_accuracy": 0.7638591527938843, + "num_tokens": 125348243.0, + "step": 54230 + }, + { + "epoch": 0.4972953149353626, + "learning_rate": 0.00010054277069771707, + "loss": 0.82, + "mean_token_accuracy": 0.7532366871833801, + "num_tokens": 125370526.0, + "step": 54240 + }, + { + "epoch": 0.49738699917484186, + "learning_rate": 0.00010052443384982122, + "loss": 0.8248, + "mean_token_accuracy": 0.7459402322769165, + "num_tokens": 125393716.0, + "step": 54250 + }, + { + "epoch": 0.49747868341432105, + "learning_rate": 0.00010050609700192538, + "loss": 0.8025, + "mean_token_accuracy": 0.759676319360733, + "num_tokens": 125416768.0, + "step": 54260 + }, + { + "epoch": 0.4975703676538003, + "learning_rate": 0.00010048776015402951, + "loss": 0.8581, + "mean_token_accuracy": 0.7408665359020233, + "num_tokens": 125439528.0, + "step": 54270 + }, + { + "epoch": 0.49766205189327956, + "learning_rate": 0.00010046942330613367, + "loss": 0.8084, + "mean_token_accuracy": 0.7522037148475647, + "num_tokens": 125462834.0, + "step": 54280 + }, + { + "epoch": 0.4977537361327588, + "learning_rate": 0.00010045108645823784, + "loss": 0.8482, + "mean_token_accuracy": 0.7438068509101867, + "num_tokens": 125485982.0, + "step": 54290 + }, + { + "epoch": 0.497845420372238, + "learning_rate": 0.000100432749610342, + "loss": 0.8153, + "mean_token_accuracy": 0.7500245273113251, + "num_tokens": 125509648.0, + "step": 54300 + }, + { + "epoch": 0.49793710461171725, + "learning_rate": 0.00010041441276244615, + "loss": 0.8459, + "mean_token_accuracy": 0.7480392217636108, + "num_tokens": 125532751.0, + "step": 54310 + }, + { + "epoch": 0.4980287888511965, + "learning_rate": 0.00010039607591455029, + "loss": 0.8357, + "mean_token_accuracy": 0.7492863476276398, + "num_tokens": 125555742.0, + "step": 54320 + }, + { + "epoch": 0.4981204730906757, + "learning_rate": 0.00010037773906665444, + "loss": 0.8396, + "mean_token_accuracy": 0.7488640606403351, + "num_tokens": 125578749.0, + "step": 54330 + }, + { + "epoch": 0.49821215733015495, + "learning_rate": 0.00010035940221875859, + "loss": 0.8007, + "mean_token_accuracy": 0.7627981245517731, + "num_tokens": 125601938.0, + "step": 54340 + }, + { + "epoch": 0.4983038415696342, + "learning_rate": 0.00010034106537086277, + "loss": 0.8868, + "mean_token_accuracy": 0.7371641397476196, + "num_tokens": 125624452.0, + "step": 54350 + }, + { + "epoch": 0.4983955258091134, + "learning_rate": 0.00010032272852296691, + "loss": 0.8319, + "mean_token_accuracy": 0.7496842861175537, + "num_tokens": 125648034.0, + "step": 54360 + }, + { + "epoch": 0.49848721004859264, + "learning_rate": 0.00010030439167507106, + "loss": 0.8401, + "mean_token_accuracy": 0.7501612901687622, + "num_tokens": 125672256.0, + "step": 54370 + }, + { + "epoch": 0.4985788942880719, + "learning_rate": 0.00010028605482717521, + "loss": 0.8522, + "mean_token_accuracy": 0.7450436055660248, + "num_tokens": 125694924.0, + "step": 54380 + }, + { + "epoch": 0.4986705785275511, + "learning_rate": 0.00010026771797927936, + "loss": 0.8261, + "mean_token_accuracy": 0.7515852391719818, + "num_tokens": 125718388.0, + "step": 54390 + }, + { + "epoch": 0.49876226276703034, + "learning_rate": 0.00010024938113138351, + "loss": 0.8366, + "mean_token_accuracy": 0.7515949666500091, + "num_tokens": 125741631.0, + "step": 54400 + }, + { + "epoch": 0.4988539470065096, + "learning_rate": 0.00010023104428348767, + "loss": 0.8088, + "mean_token_accuracy": 0.7510480940341949, + "num_tokens": 125764628.0, + "step": 54410 + }, + { + "epoch": 0.49894563124598884, + "learning_rate": 0.00010021270743559183, + "loss": 0.8109, + "mean_token_accuracy": 0.7558558702468872, + "num_tokens": 125787253.0, + "step": 54420 + }, + { + "epoch": 0.49903731548546804, + "learning_rate": 0.00010019437058769598, + "loss": 0.8274, + "mean_token_accuracy": 0.7478065371513367, + "num_tokens": 125810156.0, + "step": 54430 + }, + { + "epoch": 0.4991289997249473, + "learning_rate": 0.00010017603373980014, + "loss": 0.8462, + "mean_token_accuracy": 0.7445954740047455, + "num_tokens": 125833313.0, + "step": 54440 + }, + { + "epoch": 0.49922068396442654, + "learning_rate": 0.00010015769689190429, + "loss": 0.8254, + "mean_token_accuracy": 0.7470640480518341, + "num_tokens": 125855964.0, + "step": 54450 + }, + { + "epoch": 0.49931236820390573, + "learning_rate": 0.00010013936004400844, + "loss": 0.8168, + "mean_token_accuracy": 0.755207484960556, + "num_tokens": 125878786.0, + "step": 54460 + }, + { + "epoch": 0.499404052443385, + "learning_rate": 0.00010012102319611258, + "loss": 0.8552, + "mean_token_accuracy": 0.7470451116561889, + "num_tokens": 125901422.0, + "step": 54470 + }, + { + "epoch": 0.49949573668286423, + "learning_rate": 0.00010010268634821676, + "loss": 0.8195, + "mean_token_accuracy": 0.7487702548503876, + "num_tokens": 125924383.0, + "step": 54480 + }, + { + "epoch": 0.49958742092234343, + "learning_rate": 0.00010008434950032091, + "loss": 0.8405, + "mean_token_accuracy": 0.7458652555942535, + "num_tokens": 125947372.0, + "step": 54490 + }, + { + "epoch": 0.4996791051618227, + "learning_rate": 0.00010006601265242506, + "loss": 0.808, + "mean_token_accuracy": 0.7584410846233368, + "num_tokens": 125970240.0, + "step": 54500 + }, + { + "epoch": 0.49977078940130193, + "learning_rate": 0.00010004767580452921, + "loss": 0.8181, + "mean_token_accuracy": 0.7533949971199035, + "num_tokens": 125993205.0, + "step": 54510 + }, + { + "epoch": 0.4998624736407811, + "learning_rate": 0.00010002933895663335, + "loss": 0.8365, + "mean_token_accuracy": 0.7492292523384094, + "num_tokens": 126016370.0, + "step": 54520 + }, + { + "epoch": 0.4999541578802604, + "learning_rate": 0.0001000110021087375, + "loss": 0.8588, + "mean_token_accuracy": 0.743920087814331, + "num_tokens": 126040237.0, + "step": 54530 + }, + { + "epoch": 0.5000458421197396, + "learning_rate": 9.999266526084167e-05, + "loss": 0.8374, + "mean_token_accuracy": 0.7522234141826629, + "num_tokens": 126063868.0, + "step": 54540 + }, + { + "epoch": 0.5001375263592188, + "learning_rate": 9.997432841294582e-05, + "loss": 0.9003, + "mean_token_accuracy": 0.7352230846881866, + "num_tokens": 126086241.0, + "step": 54550 + }, + { + "epoch": 0.5002292105986981, + "learning_rate": 9.995599156504997e-05, + "loss": 0.8216, + "mean_token_accuracy": 0.7472166180610657, + "num_tokens": 126108299.0, + "step": 54560 + }, + { + "epoch": 0.5003208948381773, + "learning_rate": 9.993765471715412e-05, + "loss": 0.8875, + "mean_token_accuracy": 0.7412724792957306, + "num_tokens": 126131054.0, + "step": 54570 + }, + { + "epoch": 0.5004125790776566, + "learning_rate": 9.991931786925828e-05, + "loss": 0.795, + "mean_token_accuracy": 0.7548500001430511, + "num_tokens": 126153660.0, + "step": 54580 + }, + { + "epoch": 0.5005042633171358, + "learning_rate": 9.990098102136243e-05, + "loss": 0.8226, + "mean_token_accuracy": 0.7520363807678223, + "num_tokens": 126176936.0, + "step": 54590 + }, + { + "epoch": 0.5005959475566151, + "learning_rate": 9.988264417346659e-05, + "loss": 0.8002, + "mean_token_accuracy": 0.7580593407154084, + "num_tokens": 126200221.0, + "step": 54600 + }, + { + "epoch": 0.5006876317960942, + "learning_rate": 9.986430732557074e-05, + "loss": 0.8076, + "mean_token_accuracy": 0.7551198363304138, + "num_tokens": 126224001.0, + "step": 54610 + }, + { + "epoch": 0.5007793160355735, + "learning_rate": 9.984597047767488e-05, + "loss": 0.8287, + "mean_token_accuracy": 0.7408681035041809, + "num_tokens": 126246677.0, + "step": 54620 + }, + { + "epoch": 0.5008710002750527, + "learning_rate": 9.982763362977905e-05, + "loss": 0.8658, + "mean_token_accuracy": 0.7422008037567138, + "num_tokens": 126269735.0, + "step": 54630 + }, + { + "epoch": 0.500962684514532, + "learning_rate": 9.98092967818832e-05, + "loss": 0.7771, + "mean_token_accuracy": 0.7584976851940155, + "num_tokens": 126292808.0, + "step": 54640 + }, + { + "epoch": 0.5010543687540112, + "learning_rate": 9.979095993398735e-05, + "loss": 0.8238, + "mean_token_accuracy": 0.7523404061794281, + "num_tokens": 126315748.0, + "step": 54650 + }, + { + "epoch": 0.5011460529934905, + "learning_rate": 9.97726230860915e-05, + "loss": 0.8015, + "mean_token_accuracy": 0.7549440562725067, + "num_tokens": 126338980.0, + "step": 54660 + }, + { + "epoch": 0.5012377372329696, + "learning_rate": 9.975428623819566e-05, + "loss": 0.8345, + "mean_token_accuracy": 0.7477507054805755, + "num_tokens": 126362205.0, + "step": 54670 + }, + { + "epoch": 0.5013294214724489, + "learning_rate": 9.973594939029981e-05, + "loss": 0.8341, + "mean_token_accuracy": 0.7542234659194946, + "num_tokens": 126385467.0, + "step": 54680 + }, + { + "epoch": 0.5014211057119281, + "learning_rate": 9.971761254240397e-05, + "loss": 0.8446, + "mean_token_accuracy": 0.7496972739696502, + "num_tokens": 126408886.0, + "step": 54690 + }, + { + "epoch": 0.5015127899514074, + "learning_rate": 9.969927569450813e-05, + "loss": 0.8107, + "mean_token_accuracy": 0.7551493108272552, + "num_tokens": 126431755.0, + "step": 54700 + }, + { + "epoch": 0.5016044741908866, + "learning_rate": 9.968093884661228e-05, + "loss": 0.8558, + "mean_token_accuracy": 0.7427143335342408, + "num_tokens": 126454755.0, + "step": 54710 + }, + { + "epoch": 0.5016961584303659, + "learning_rate": 9.966260199871642e-05, + "loss": 0.8604, + "mean_token_accuracy": 0.739615398645401, + "num_tokens": 126477920.0, + "step": 54720 + }, + { + "epoch": 0.5017878426698451, + "learning_rate": 9.964426515082058e-05, + "loss": 0.8436, + "mean_token_accuracy": 0.7475731015205384, + "num_tokens": 126501745.0, + "step": 54730 + }, + { + "epoch": 0.5018795269093242, + "learning_rate": 9.962592830292473e-05, + "loss": 0.8653, + "mean_token_accuracy": 0.7458015322685242, + "num_tokens": 126524704.0, + "step": 54740 + }, + { + "epoch": 0.5019712111488035, + "learning_rate": 9.960759145502888e-05, + "loss": 0.9123, + "mean_token_accuracy": 0.731933981180191, + "num_tokens": 126547338.0, + "step": 54750 + }, + { + "epoch": 0.5020628953882827, + "learning_rate": 9.958925460713304e-05, + "loss": 0.8152, + "mean_token_accuracy": 0.7562912046909332, + "num_tokens": 126570696.0, + "step": 54760 + }, + { + "epoch": 0.502154579627762, + "learning_rate": 9.957091775923719e-05, + "loss": 0.8748, + "mean_token_accuracy": 0.7461549878120423, + "num_tokens": 126594498.0, + "step": 54770 + }, + { + "epoch": 0.5022462638672412, + "learning_rate": 9.955258091134134e-05, + "loss": 0.8205, + "mean_token_accuracy": 0.7527951240539551, + "num_tokens": 126617710.0, + "step": 54780 + }, + { + "epoch": 0.5023379481067205, + "learning_rate": 9.95342440634455e-05, + "loss": 0.8289, + "mean_token_accuracy": 0.7487452089786529, + "num_tokens": 126641340.0, + "step": 54790 + }, + { + "epoch": 0.5024296323461996, + "learning_rate": 9.951590721554966e-05, + "loss": 0.8443, + "mean_token_accuracy": 0.7519077181816101, + "num_tokens": 126663634.0, + "step": 54800 + }, + { + "epoch": 0.5025213165856789, + "learning_rate": 9.949757036765381e-05, + "loss": 0.8628, + "mean_token_accuracy": 0.744753384590149, + "num_tokens": 126686917.0, + "step": 54810 + }, + { + "epoch": 0.5026130008251581, + "learning_rate": 9.947923351975796e-05, + "loss": 0.8132, + "mean_token_accuracy": 0.7549303352832795, + "num_tokens": 126710460.0, + "step": 54820 + }, + { + "epoch": 0.5027046850646374, + "learning_rate": 9.946089667186211e-05, + "loss": 0.8384, + "mean_token_accuracy": 0.7446047544479371, + "num_tokens": 126733935.0, + "step": 54830 + }, + { + "epoch": 0.5027963693041166, + "learning_rate": 9.944255982396626e-05, + "loss": 0.8442, + "mean_token_accuracy": 0.7540520310401917, + "num_tokens": 126756564.0, + "step": 54840 + }, + { + "epoch": 0.5028880535435959, + "learning_rate": 9.942422297607042e-05, + "loss": 0.8569, + "mean_token_accuracy": 0.743932569026947, + "num_tokens": 126780825.0, + "step": 54850 + }, + { + "epoch": 0.5029797377830751, + "learning_rate": 9.940588612817457e-05, + "loss": 0.8118, + "mean_token_accuracy": 0.7560799717903137, + "num_tokens": 126804400.0, + "step": 54860 + }, + { + "epoch": 0.5030714220225543, + "learning_rate": 9.938754928027872e-05, + "loss": 0.8321, + "mean_token_accuracy": 0.7500090837478638, + "num_tokens": 126828220.0, + "step": 54870 + }, + { + "epoch": 0.5031631062620335, + "learning_rate": 9.936921243238287e-05, + "loss": 0.8669, + "mean_token_accuracy": 0.7424058318138123, + "num_tokens": 126851194.0, + "step": 54880 + }, + { + "epoch": 0.5032547905015128, + "learning_rate": 9.935087558448704e-05, + "loss": 0.8542, + "mean_token_accuracy": 0.7454552531242371, + "num_tokens": 126874381.0, + "step": 54890 + }, + { + "epoch": 0.503346474740992, + "learning_rate": 9.933253873659119e-05, + "loss": 0.7986, + "mean_token_accuracy": 0.7588015139102936, + "num_tokens": 126897302.0, + "step": 54900 + }, + { + "epoch": 0.5034381589804713, + "learning_rate": 9.931420188869534e-05, + "loss": 0.8631, + "mean_token_accuracy": 0.7387021481990814, + "num_tokens": 126920953.0, + "step": 54910 + }, + { + "epoch": 0.5035298432199505, + "learning_rate": 9.92958650407995e-05, + "loss": 0.816, + "mean_token_accuracy": 0.7493123829364776, + "num_tokens": 126943968.0, + "step": 54920 + }, + { + "epoch": 0.5036215274594297, + "learning_rate": 9.927752819290365e-05, + "loss": 0.8326, + "mean_token_accuracy": 0.743408453464508, + "num_tokens": 126966237.0, + "step": 54930 + }, + { + "epoch": 0.5037132116989089, + "learning_rate": 9.92591913450078e-05, + "loss": 0.8511, + "mean_token_accuracy": 0.7374984502792359, + "num_tokens": 126989481.0, + "step": 54940 + }, + { + "epoch": 0.5038048959383882, + "learning_rate": 9.924085449711195e-05, + "loss": 0.7858, + "mean_token_accuracy": 0.7659353673458099, + "num_tokens": 127012831.0, + "step": 54950 + }, + { + "epoch": 0.5038965801778674, + "learning_rate": 9.92225176492161e-05, + "loss": 0.8699, + "mean_token_accuracy": 0.7392362534999848, + "num_tokens": 127036098.0, + "step": 54960 + }, + { + "epoch": 0.5039882644173467, + "learning_rate": 9.920418080132025e-05, + "loss": 0.8157, + "mean_token_accuracy": 0.7554765939712524, + "num_tokens": 127059532.0, + "step": 54970 + }, + { + "epoch": 0.5040799486568259, + "learning_rate": 9.91858439534244e-05, + "loss": 0.8554, + "mean_token_accuracy": 0.740082061290741, + "num_tokens": 127083105.0, + "step": 54980 + }, + { + "epoch": 0.5041716328963052, + "learning_rate": 9.916750710552857e-05, + "loss": 0.8639, + "mean_token_accuracy": 0.7439696490764618, + "num_tokens": 127106250.0, + "step": 54990 + }, + { + "epoch": 0.5042633171357843, + "learning_rate": 9.914917025763272e-05, + "loss": 0.8385, + "mean_token_accuracy": 0.7487026512622833, + "num_tokens": 127130489.0, + "step": 55000 + }, + { + "epoch": 0.5043550013752636, + "learning_rate": 9.913083340973687e-05, + "loss": 0.8679, + "mean_token_accuracy": 0.7465303182601929, + "num_tokens": 127153623.0, + "step": 55010 + }, + { + "epoch": 0.5044466856147428, + "learning_rate": 9.911249656184103e-05, + "loss": 0.8631, + "mean_token_accuracy": 0.7382868230342865, + "num_tokens": 127176977.0, + "step": 55020 + }, + { + "epoch": 0.5045383698542221, + "learning_rate": 9.909415971394518e-05, + "loss": 0.8424, + "mean_token_accuracy": 0.7415868818759919, + "num_tokens": 127200079.0, + "step": 55030 + }, + { + "epoch": 0.5046300540937013, + "learning_rate": 9.907582286604933e-05, + "loss": 0.8239, + "mean_token_accuracy": 0.7546780347824097, + "num_tokens": 127224392.0, + "step": 55040 + }, + { + "epoch": 0.5047217383331806, + "learning_rate": 9.90574860181535e-05, + "loss": 0.8825, + "mean_token_accuracy": 0.7388218402862549, + "num_tokens": 127247293.0, + "step": 55050 + }, + { + "epoch": 0.5048134225726597, + "learning_rate": 9.903914917025763e-05, + "loss": 0.8748, + "mean_token_accuracy": 0.741418582201004, + "num_tokens": 127271290.0, + "step": 55060 + }, + { + "epoch": 0.504905106812139, + "learning_rate": 9.902081232236178e-05, + "loss": 0.831, + "mean_token_accuracy": 0.7555666148662568, + "num_tokens": 127294268.0, + "step": 55070 + }, + { + "epoch": 0.5049967910516182, + "learning_rate": 9.900247547446594e-05, + "loss": 0.8298, + "mean_token_accuracy": 0.7488799631595612, + "num_tokens": 127317141.0, + "step": 55080 + }, + { + "epoch": 0.5050884752910975, + "learning_rate": 9.89841386265701e-05, + "loss": 0.8157, + "mean_token_accuracy": 0.7507079720497132, + "num_tokens": 127339832.0, + "step": 55090 + }, + { + "epoch": 0.5051801595305767, + "learning_rate": 9.896580177867425e-05, + "loss": 0.855, + "mean_token_accuracy": 0.7446078598499298, + "num_tokens": 127363129.0, + "step": 55100 + }, + { + "epoch": 0.505271843770056, + "learning_rate": 9.89474649307784e-05, + "loss": 0.7936, + "mean_token_accuracy": 0.7580273449420929, + "num_tokens": 127386426.0, + "step": 55110 + }, + { + "epoch": 0.5053635280095352, + "learning_rate": 9.892912808288256e-05, + "loss": 0.8335, + "mean_token_accuracy": 0.7495563566684723, + "num_tokens": 127409625.0, + "step": 55120 + }, + { + "epoch": 0.5054552122490144, + "learning_rate": 9.891079123498671e-05, + "loss": 0.8048, + "mean_token_accuracy": 0.7522223949432373, + "num_tokens": 127432061.0, + "step": 55130 + }, + { + "epoch": 0.5055468964884936, + "learning_rate": 9.889245438709086e-05, + "loss": 0.8334, + "mean_token_accuracy": 0.744785737991333, + "num_tokens": 127455714.0, + "step": 55140 + }, + { + "epoch": 0.5056385807279729, + "learning_rate": 9.887411753919503e-05, + "loss": 0.8419, + "mean_token_accuracy": 0.7535149455070496, + "num_tokens": 127478644.0, + "step": 55150 + }, + { + "epoch": 0.5057302649674521, + "learning_rate": 9.885578069129917e-05, + "loss": 0.8201, + "mean_token_accuracy": 0.7557021617889405, + "num_tokens": 127501827.0, + "step": 55160 + }, + { + "epoch": 0.5058219492069314, + "learning_rate": 9.883744384340332e-05, + "loss": 0.8542, + "mean_token_accuracy": 0.7471792221069335, + "num_tokens": 127526083.0, + "step": 55170 + }, + { + "epoch": 0.5059136334464106, + "learning_rate": 9.881910699550748e-05, + "loss": 0.8333, + "mean_token_accuracy": 0.7493178725242615, + "num_tokens": 127550299.0, + "step": 55180 + }, + { + "epoch": 0.5060053176858897, + "learning_rate": 9.880077014761163e-05, + "loss": 0.81, + "mean_token_accuracy": 0.7530982732772827, + "num_tokens": 127573181.0, + "step": 55190 + }, + { + "epoch": 0.506097001925369, + "learning_rate": 9.878243329971579e-05, + "loss": 0.8404, + "mean_token_accuracy": 0.7522773265838623, + "num_tokens": 127596723.0, + "step": 55200 + }, + { + "epoch": 0.5061886861648482, + "learning_rate": 9.876409645181994e-05, + "loss": 0.8377, + "mean_token_accuracy": 0.7426759779453278, + "num_tokens": 127620142.0, + "step": 55210 + }, + { + "epoch": 0.5062803704043275, + "learning_rate": 9.874575960392409e-05, + "loss": 0.8365, + "mean_token_accuracy": 0.7444867551326751, + "num_tokens": 127643905.0, + "step": 55220 + }, + { + "epoch": 0.5063720546438067, + "learning_rate": 9.872742275602824e-05, + "loss": 0.8287, + "mean_token_accuracy": 0.7522559106349945, + "num_tokens": 127666297.0, + "step": 55230 + }, + { + "epoch": 0.506463738883286, + "learning_rate": 9.87090859081324e-05, + "loss": 0.8852, + "mean_token_accuracy": 0.7422611057758332, + "num_tokens": 127689578.0, + "step": 55240 + }, + { + "epoch": 0.5065554231227652, + "learning_rate": 9.869074906023656e-05, + "loss": 0.8448, + "mean_token_accuracy": 0.7505880951881408, + "num_tokens": 127712282.0, + "step": 55250 + }, + { + "epoch": 0.5066471073622444, + "learning_rate": 9.86724122123407e-05, + "loss": 0.8387, + "mean_token_accuracy": 0.7525406897068023, + "num_tokens": 127735198.0, + "step": 55260 + }, + { + "epoch": 0.5067387916017236, + "learning_rate": 9.865407536444485e-05, + "loss": 0.8404, + "mean_token_accuracy": 0.7460958778858184, + "num_tokens": 127758639.0, + "step": 55270 + }, + { + "epoch": 0.5068304758412029, + "learning_rate": 9.863573851654901e-05, + "loss": 0.8362, + "mean_token_accuracy": 0.7530414164066315, + "num_tokens": 127781784.0, + "step": 55280 + }, + { + "epoch": 0.5069221600806821, + "learning_rate": 9.861740166865317e-05, + "loss": 0.8662, + "mean_token_accuracy": 0.7414700984954834, + "num_tokens": 127804452.0, + "step": 55290 + }, + { + "epoch": 0.5070138443201614, + "learning_rate": 9.859906482075732e-05, + "loss": 0.8508, + "mean_token_accuracy": 0.7503695964813233, + "num_tokens": 127827346.0, + "step": 55300 + }, + { + "epoch": 0.5071055285596406, + "learning_rate": 9.858072797286147e-05, + "loss": 0.8668, + "mean_token_accuracy": 0.7402788043022156, + "num_tokens": 127849687.0, + "step": 55310 + }, + { + "epoch": 0.5071972127991198, + "learning_rate": 9.856239112496562e-05, + "loss": 0.8159, + "mean_token_accuracy": 0.7513509571552277, + "num_tokens": 127872183.0, + "step": 55320 + }, + { + "epoch": 0.507288897038599, + "learning_rate": 9.854405427706977e-05, + "loss": 0.8247, + "mean_token_accuracy": 0.756741201877594, + "num_tokens": 127895640.0, + "step": 55330 + }, + { + "epoch": 0.5073805812780783, + "learning_rate": 9.852571742917393e-05, + "loss": 0.8245, + "mean_token_accuracy": 0.754223370552063, + "num_tokens": 127919095.0, + "step": 55340 + }, + { + "epoch": 0.5074722655175575, + "learning_rate": 9.850738058127809e-05, + "loss": 0.8002, + "mean_token_accuracy": 0.7614878475666046, + "num_tokens": 127942701.0, + "step": 55350 + }, + { + "epoch": 0.5075639497570368, + "learning_rate": 9.848904373338223e-05, + "loss": 0.8173, + "mean_token_accuracy": 0.749773132801056, + "num_tokens": 127965305.0, + "step": 55360 + }, + { + "epoch": 0.507655633996516, + "learning_rate": 9.847070688548638e-05, + "loss": 0.8757, + "mean_token_accuracy": 0.7366073966026306, + "num_tokens": 127988287.0, + "step": 55370 + }, + { + "epoch": 0.5077473182359953, + "learning_rate": 9.845237003759055e-05, + "loss": 0.831, + "mean_token_accuracy": 0.7543848633766175, + "num_tokens": 128011174.0, + "step": 55380 + }, + { + "epoch": 0.5078390024754744, + "learning_rate": 9.84340331896947e-05, + "loss": 0.8514, + "mean_token_accuracy": 0.7410233438014984, + "num_tokens": 128034072.0, + "step": 55390 + }, + { + "epoch": 0.5079306867149537, + "learning_rate": 9.841569634179885e-05, + "loss": 0.8779, + "mean_token_accuracy": 0.7453109204769135, + "num_tokens": 128057754.0, + "step": 55400 + }, + { + "epoch": 0.5080223709544329, + "learning_rate": 9.8397359493903e-05, + "loss": 0.8555, + "mean_token_accuracy": 0.7473021626472474, + "num_tokens": 128080279.0, + "step": 55410 + }, + { + "epoch": 0.5081140551939122, + "learning_rate": 9.837902264600715e-05, + "loss": 0.8355, + "mean_token_accuracy": 0.7450722455978394, + "num_tokens": 128104021.0, + "step": 55420 + }, + { + "epoch": 0.5082057394333914, + "learning_rate": 9.83606857981113e-05, + "loss": 0.7832, + "mean_token_accuracy": 0.7592859029769897, + "num_tokens": 128127786.0, + "step": 55430 + }, + { + "epoch": 0.5082974236728707, + "learning_rate": 9.834234895021546e-05, + "loss": 0.8529, + "mean_token_accuracy": 0.7397254407405853, + "num_tokens": 128150101.0, + "step": 55440 + }, + { + "epoch": 0.5083891079123498, + "learning_rate": 9.832401210231962e-05, + "loss": 0.8281, + "mean_token_accuracy": 0.7477978467941284, + "num_tokens": 128173294.0, + "step": 55450 + }, + { + "epoch": 0.5084807921518291, + "learning_rate": 9.830567525442376e-05, + "loss": 0.8327, + "mean_token_accuracy": 0.7507203817367554, + "num_tokens": 128196072.0, + "step": 55460 + }, + { + "epoch": 0.5085724763913083, + "learning_rate": 9.828733840652791e-05, + "loss": 0.8332, + "mean_token_accuracy": 0.7511986076831818, + "num_tokens": 128218837.0, + "step": 55470 + }, + { + "epoch": 0.5086641606307876, + "learning_rate": 9.826900155863208e-05, + "loss": 0.8161, + "mean_token_accuracy": 0.7469117105007171, + "num_tokens": 128241361.0, + "step": 55480 + }, + { + "epoch": 0.5087558448702668, + "learning_rate": 9.825066471073623e-05, + "loss": 0.8451, + "mean_token_accuracy": 0.7483738541603089, + "num_tokens": 128265047.0, + "step": 55490 + }, + { + "epoch": 0.5088475291097461, + "learning_rate": 9.823232786284038e-05, + "loss": 0.8965, + "mean_token_accuracy": 0.7301852464675903, + "num_tokens": 128288379.0, + "step": 55500 + }, + { + "epoch": 0.5089392133492253, + "learning_rate": 9.821399101494453e-05, + "loss": 0.8595, + "mean_token_accuracy": 0.7519036054611206, + "num_tokens": 128311210.0, + "step": 55510 + }, + { + "epoch": 0.5090308975887045, + "learning_rate": 9.819565416704869e-05, + "loss": 0.8316, + "mean_token_accuracy": 0.7539181113243103, + "num_tokens": 128333412.0, + "step": 55520 + }, + { + "epoch": 0.5091225818281837, + "learning_rate": 9.817731731915284e-05, + "loss": 0.824, + "mean_token_accuracy": 0.7523548245429993, + "num_tokens": 128355933.0, + "step": 55530 + }, + { + "epoch": 0.509214266067663, + "learning_rate": 9.8158980471257e-05, + "loss": 0.8388, + "mean_token_accuracy": 0.749217939376831, + "num_tokens": 128379533.0, + "step": 55540 + }, + { + "epoch": 0.5093059503071422, + "learning_rate": 9.814064362336116e-05, + "loss": 0.8668, + "mean_token_accuracy": 0.7430170595645904, + "num_tokens": 128402664.0, + "step": 55550 + }, + { + "epoch": 0.5093976345466215, + "learning_rate": 9.81223067754653e-05, + "loss": 0.8508, + "mean_token_accuracy": 0.743842476606369, + "num_tokens": 128425739.0, + "step": 55560 + }, + { + "epoch": 0.5094893187861007, + "learning_rate": 9.810396992756945e-05, + "loss": 0.8464, + "mean_token_accuracy": 0.7461042940616608, + "num_tokens": 128447730.0, + "step": 55570 + }, + { + "epoch": 0.5095810030255798, + "learning_rate": 9.808563307967361e-05, + "loss": 0.8227, + "mean_token_accuracy": 0.7504740059375763, + "num_tokens": 128470146.0, + "step": 55580 + }, + { + "epoch": 0.5096726872650591, + "learning_rate": 9.806729623177776e-05, + "loss": 0.8586, + "mean_token_accuracy": 0.7417598307132721, + "num_tokens": 128493164.0, + "step": 55590 + }, + { + "epoch": 0.5097643715045383, + "learning_rate": 9.804895938388192e-05, + "loss": 0.8203, + "mean_token_accuracy": 0.7573263347148895, + "num_tokens": 128516133.0, + "step": 55600 + }, + { + "epoch": 0.5098560557440176, + "learning_rate": 9.803062253598607e-05, + "loss": 0.8476, + "mean_token_accuracy": 0.7501390933990478, + "num_tokens": 128539886.0, + "step": 55610 + }, + { + "epoch": 0.5099477399834969, + "learning_rate": 9.801228568809022e-05, + "loss": 0.829, + "mean_token_accuracy": 0.7500462651252746, + "num_tokens": 128562059.0, + "step": 55620 + }, + { + "epoch": 0.5100394242229761, + "learning_rate": 9.799394884019437e-05, + "loss": 0.8409, + "mean_token_accuracy": 0.7515318751335144, + "num_tokens": 128585511.0, + "step": 55630 + }, + { + "epoch": 0.5101311084624554, + "learning_rate": 9.797561199229854e-05, + "loss": 0.881, + "mean_token_accuracy": 0.7405971586704254, + "num_tokens": 128608428.0, + "step": 55640 + }, + { + "epoch": 0.5102227927019345, + "learning_rate": 9.795727514440269e-05, + "loss": 0.8368, + "mean_token_accuracy": 0.7500964045524597, + "num_tokens": 128632418.0, + "step": 55650 + }, + { + "epoch": 0.5103144769414137, + "learning_rate": 9.793893829650683e-05, + "loss": 0.8704, + "mean_token_accuracy": 0.7406009614467621, + "num_tokens": 128655669.0, + "step": 55660 + }, + { + "epoch": 0.510406161180893, + "learning_rate": 9.792060144861099e-05, + "loss": 0.832, + "mean_token_accuracy": 0.7474497854709625, + "num_tokens": 128678512.0, + "step": 55670 + }, + { + "epoch": 0.5104978454203722, + "learning_rate": 9.790226460071514e-05, + "loss": 0.8726, + "mean_token_accuracy": 0.7440742075443267, + "num_tokens": 128701958.0, + "step": 55680 + }, + { + "epoch": 0.5105895296598515, + "learning_rate": 9.78839277528193e-05, + "loss": 0.8136, + "mean_token_accuracy": 0.757123863697052, + "num_tokens": 128725537.0, + "step": 55690 + }, + { + "epoch": 0.5106812138993307, + "learning_rate": 9.786559090492345e-05, + "loss": 0.8167, + "mean_token_accuracy": 0.7601333737373352, + "num_tokens": 128748847.0, + "step": 55700 + }, + { + "epoch": 0.5107728981388099, + "learning_rate": 9.78472540570276e-05, + "loss": 0.8316, + "mean_token_accuracy": 0.7527754962444305, + "num_tokens": 128771671.0, + "step": 55710 + }, + { + "epoch": 0.5108645823782891, + "learning_rate": 9.782891720913175e-05, + "loss": 0.819, + "mean_token_accuracy": 0.7536244928836823, + "num_tokens": 128794737.0, + "step": 55720 + }, + { + "epoch": 0.5109562666177684, + "learning_rate": 9.78105803612359e-05, + "loss": 0.8791, + "mean_token_accuracy": 0.7345493853092193, + "num_tokens": 128818320.0, + "step": 55730 + }, + { + "epoch": 0.5110479508572476, + "learning_rate": 9.779224351334007e-05, + "loss": 0.8131, + "mean_token_accuracy": 0.7515747964382171, + "num_tokens": 128841468.0, + "step": 55740 + }, + { + "epoch": 0.5111396350967269, + "learning_rate": 9.777390666544422e-05, + "loss": 0.8233, + "mean_token_accuracy": 0.7469059705734253, + "num_tokens": 128864809.0, + "step": 55750 + }, + { + "epoch": 0.5112313193362061, + "learning_rate": 9.775556981754836e-05, + "loss": 0.8099, + "mean_token_accuracy": 0.7587299227714539, + "num_tokens": 128888020.0, + "step": 55760 + }, + { + "epoch": 0.5113230035756854, + "learning_rate": 9.773723296965252e-05, + "loss": 0.8205, + "mean_token_accuracy": 0.7524077892303467, + "num_tokens": 128911578.0, + "step": 55770 + }, + { + "epoch": 0.5114146878151645, + "learning_rate": 9.771889612175668e-05, + "loss": 0.8379, + "mean_token_accuracy": 0.753923523426056, + "num_tokens": 128935301.0, + "step": 55780 + }, + { + "epoch": 0.5115063720546438, + "learning_rate": 9.770055927386083e-05, + "loss": 0.8246, + "mean_token_accuracy": 0.7583781242370605, + "num_tokens": 128958541.0, + "step": 55790 + }, + { + "epoch": 0.511598056294123, + "learning_rate": 9.7682222425965e-05, + "loss": 0.8825, + "mean_token_accuracy": 0.7409592568874359, + "num_tokens": 128981377.0, + "step": 55800 + }, + { + "epoch": 0.5116897405336023, + "learning_rate": 9.766388557806913e-05, + "loss": 0.7769, + "mean_token_accuracy": 0.7621455550193786, + "num_tokens": 129003669.0, + "step": 55810 + }, + { + "epoch": 0.5117814247730815, + "learning_rate": 9.764554873017328e-05, + "loss": 0.8672, + "mean_token_accuracy": 0.745113855600357, + "num_tokens": 129026295.0, + "step": 55820 + }, + { + "epoch": 0.5118731090125608, + "learning_rate": 9.762721188227744e-05, + "loss": 0.8218, + "mean_token_accuracy": 0.7521910727024078, + "num_tokens": 129049756.0, + "step": 55830 + }, + { + "epoch": 0.51196479325204, + "learning_rate": 9.76088750343816e-05, + "loss": 0.8182, + "mean_token_accuracy": 0.7492237269878388, + "num_tokens": 129072490.0, + "step": 55840 + }, + { + "epoch": 0.5120564774915192, + "learning_rate": 9.759053818648575e-05, + "loss": 0.836, + "mean_token_accuracy": 0.7493184745311737, + "num_tokens": 129095824.0, + "step": 55850 + }, + { + "epoch": 0.5121481617309984, + "learning_rate": 9.757220133858989e-05, + "loss": 0.848, + "mean_token_accuracy": 0.7501515507698059, + "num_tokens": 129118889.0, + "step": 55860 + }, + { + "epoch": 0.5122398459704777, + "learning_rate": 9.755386449069406e-05, + "loss": 0.8599, + "mean_token_accuracy": 0.745026308298111, + "num_tokens": 129142115.0, + "step": 55870 + }, + { + "epoch": 0.5123315302099569, + "learning_rate": 9.753552764279821e-05, + "loss": 0.8507, + "mean_token_accuracy": 0.7484850764274598, + "num_tokens": 129164757.0, + "step": 55880 + }, + { + "epoch": 0.5124232144494362, + "learning_rate": 9.751719079490236e-05, + "loss": 0.8433, + "mean_token_accuracy": 0.7456823706626892, + "num_tokens": 129187540.0, + "step": 55890 + }, + { + "epoch": 0.5125148986889154, + "learning_rate": 9.749885394700653e-05, + "loss": 0.8286, + "mean_token_accuracy": 0.7571347236633301, + "num_tokens": 129210427.0, + "step": 55900 + }, + { + "epoch": 0.5126065829283946, + "learning_rate": 9.748051709911066e-05, + "loss": 0.8518, + "mean_token_accuracy": 0.7484507083892822, + "num_tokens": 129234739.0, + "step": 55910 + }, + { + "epoch": 0.5126982671678738, + "learning_rate": 9.746218025121482e-05, + "loss": 0.8472, + "mean_token_accuracy": 0.7446218013763428, + "num_tokens": 129258461.0, + "step": 55920 + }, + { + "epoch": 0.5127899514073531, + "learning_rate": 9.744384340331898e-05, + "loss": 0.8088, + "mean_token_accuracy": 0.7495130300521851, + "num_tokens": 129281228.0, + "step": 55930 + }, + { + "epoch": 0.5128816356468323, + "learning_rate": 9.742550655542313e-05, + "loss": 0.8407, + "mean_token_accuracy": 0.7451620817184448, + "num_tokens": 129304144.0, + "step": 55940 + }, + { + "epoch": 0.5129733198863116, + "learning_rate": 9.740716970752728e-05, + "loss": 0.8748, + "mean_token_accuracy": 0.7495053827762603, + "num_tokens": 129327151.0, + "step": 55950 + }, + { + "epoch": 0.5130650041257908, + "learning_rate": 9.738883285963142e-05, + "loss": 0.8397, + "mean_token_accuracy": 0.7442684769630432, + "num_tokens": 129349965.0, + "step": 55960 + }, + { + "epoch": 0.5131566883652701, + "learning_rate": 9.737049601173559e-05, + "loss": 0.8463, + "mean_token_accuracy": 0.7464066505432129, + "num_tokens": 129372206.0, + "step": 55970 + }, + { + "epoch": 0.5132483726047492, + "learning_rate": 9.735215916383974e-05, + "loss": 0.792, + "mean_token_accuracy": 0.7607055842876435, + "num_tokens": 129395855.0, + "step": 55980 + }, + { + "epoch": 0.5133400568442285, + "learning_rate": 9.733382231594389e-05, + "loss": 0.862, + "mean_token_accuracy": 0.743760633468628, + "num_tokens": 129418954.0, + "step": 55990 + }, + { + "epoch": 0.5134317410837077, + "learning_rate": 9.731548546804806e-05, + "loss": 0.8685, + "mean_token_accuracy": 0.7486790597438813, + "num_tokens": 129441879.0, + "step": 56000 + }, + { + "epoch": 0.513523425323187, + "learning_rate": 9.72971486201522e-05, + "loss": 0.8007, + "mean_token_accuracy": 0.7590884685516357, + "num_tokens": 129465720.0, + "step": 56010 + }, + { + "epoch": 0.5136151095626662, + "learning_rate": 9.727881177225635e-05, + "loss": 0.8273, + "mean_token_accuracy": 0.74710493683815, + "num_tokens": 129489680.0, + "step": 56020 + }, + { + "epoch": 0.5137067938021455, + "learning_rate": 9.726047492436051e-05, + "loss": 0.8471, + "mean_token_accuracy": 0.7541328251361847, + "num_tokens": 129513337.0, + "step": 56030 + }, + { + "epoch": 0.5137984780416246, + "learning_rate": 9.724213807646467e-05, + "loss": 0.8607, + "mean_token_accuracy": 0.7480553388595581, + "num_tokens": 129536815.0, + "step": 56040 + }, + { + "epoch": 0.5138901622811038, + "learning_rate": 9.722380122856882e-05, + "loss": 0.8584, + "mean_token_accuracy": 0.7457198381423951, + "num_tokens": 129559278.0, + "step": 56050 + }, + { + "epoch": 0.5139818465205831, + "learning_rate": 9.720546438067296e-05, + "loss": 0.841, + "mean_token_accuracy": 0.7460310757160187, + "num_tokens": 129581530.0, + "step": 56060 + }, + { + "epoch": 0.5140735307600623, + "learning_rate": 9.718712753277712e-05, + "loss": 0.8485, + "mean_token_accuracy": 0.7485625565052032, + "num_tokens": 129604600.0, + "step": 56070 + }, + { + "epoch": 0.5141652149995416, + "learning_rate": 9.716879068488127e-05, + "loss": 0.8587, + "mean_token_accuracy": 0.7470367312431335, + "num_tokens": 129627948.0, + "step": 56080 + }, + { + "epoch": 0.5142568992390208, + "learning_rate": 9.715045383698542e-05, + "loss": 0.8491, + "mean_token_accuracy": 0.7488150477409363, + "num_tokens": 129651538.0, + "step": 56090 + }, + { + "epoch": 0.5143485834785001, + "learning_rate": 9.713211698908959e-05, + "loss": 0.8513, + "mean_token_accuracy": 0.7482627809047699, + "num_tokens": 129674323.0, + "step": 56100 + }, + { + "epoch": 0.5144402677179792, + "learning_rate": 9.711378014119373e-05, + "loss": 0.8308, + "mean_token_accuracy": 0.7516775965690613, + "num_tokens": 129696668.0, + "step": 56110 + }, + { + "epoch": 0.5145319519574585, + "learning_rate": 9.709544329329788e-05, + "loss": 0.8254, + "mean_token_accuracy": 0.7606424748897552, + "num_tokens": 129720306.0, + "step": 56120 + }, + { + "epoch": 0.5146236361969377, + "learning_rate": 9.707710644540205e-05, + "loss": 0.8582, + "mean_token_accuracy": 0.7417102813720703, + "num_tokens": 129742964.0, + "step": 56130 + }, + { + "epoch": 0.514715320436417, + "learning_rate": 9.70587695975062e-05, + "loss": 0.8562, + "mean_token_accuracy": 0.7418065547943116, + "num_tokens": 129766227.0, + "step": 56140 + }, + { + "epoch": 0.5148070046758962, + "learning_rate": 9.704043274961035e-05, + "loss": 0.876, + "mean_token_accuracy": 0.745196384191513, + "num_tokens": 129789345.0, + "step": 56150 + }, + { + "epoch": 0.5148986889153755, + "learning_rate": 9.70220959017145e-05, + "loss": 0.8416, + "mean_token_accuracy": 0.7529929518699646, + "num_tokens": 129813158.0, + "step": 56160 + }, + { + "epoch": 0.5149903731548546, + "learning_rate": 9.700375905381865e-05, + "loss": 0.8494, + "mean_token_accuracy": 0.7480137288570404, + "num_tokens": 129836146.0, + "step": 56170 + }, + { + "epoch": 0.5150820573943339, + "learning_rate": 9.69854222059228e-05, + "loss": 0.8431, + "mean_token_accuracy": 0.7475702226161957, + "num_tokens": 129859853.0, + "step": 56180 + }, + { + "epoch": 0.5151737416338131, + "learning_rate": 9.696708535802696e-05, + "loss": 0.8415, + "mean_token_accuracy": 0.7543336629867554, + "num_tokens": 129882598.0, + "step": 56190 + }, + { + "epoch": 0.5152654258732924, + "learning_rate": 9.694874851013112e-05, + "loss": 0.8129, + "mean_token_accuracy": 0.7548528909683228, + "num_tokens": 129905096.0, + "step": 56200 + }, + { + "epoch": 0.5153571101127716, + "learning_rate": 9.693041166223526e-05, + "loss": 0.7859, + "mean_token_accuracy": 0.7606727242469787, + "num_tokens": 129928093.0, + "step": 56210 + }, + { + "epoch": 0.5154487943522509, + "learning_rate": 9.691207481433941e-05, + "loss": 0.8208, + "mean_token_accuracy": 0.7520423114299775, + "num_tokens": 129951594.0, + "step": 56220 + }, + { + "epoch": 0.5155404785917301, + "learning_rate": 9.689373796644358e-05, + "loss": 0.836, + "mean_token_accuracy": 0.7486515760421752, + "num_tokens": 129974314.0, + "step": 56230 + }, + { + "epoch": 0.5156321628312093, + "learning_rate": 9.687540111854773e-05, + "loss": 0.7994, + "mean_token_accuracy": 0.7629447162151337, + "num_tokens": 129997542.0, + "step": 56240 + }, + { + "epoch": 0.5157238470706885, + "learning_rate": 9.685706427065188e-05, + "loss": 0.881, + "mean_token_accuracy": 0.7391123592853546, + "num_tokens": 130020459.0, + "step": 56250 + }, + { + "epoch": 0.5158155313101678, + "learning_rate": 9.683872742275603e-05, + "loss": 0.8586, + "mean_token_accuracy": 0.7472450077533722, + "num_tokens": 130043649.0, + "step": 56260 + }, + { + "epoch": 0.515907215549647, + "learning_rate": 9.682039057486019e-05, + "loss": 0.8366, + "mean_token_accuracy": 0.7542475044727326, + "num_tokens": 130067388.0, + "step": 56270 + }, + { + "epoch": 0.5159988997891263, + "learning_rate": 9.680205372696434e-05, + "loss": 0.8469, + "mean_token_accuracy": 0.7474272787570954, + "num_tokens": 130090318.0, + "step": 56280 + }, + { + "epoch": 0.5160905840286055, + "learning_rate": 9.67837168790685e-05, + "loss": 0.8452, + "mean_token_accuracy": 0.7500754296779633, + "num_tokens": 130113308.0, + "step": 56290 + }, + { + "epoch": 0.5161822682680847, + "learning_rate": 9.676538003117265e-05, + "loss": 0.8895, + "mean_token_accuracy": 0.7304994821548462, + "num_tokens": 130136726.0, + "step": 56300 + }, + { + "epoch": 0.5162739525075639, + "learning_rate": 9.674704318327679e-05, + "loss": 0.8225, + "mean_token_accuracy": 0.7477835178375244, + "num_tokens": 130159769.0, + "step": 56310 + }, + { + "epoch": 0.5163656367470432, + "learning_rate": 9.672870633538094e-05, + "loss": 0.8408, + "mean_token_accuracy": 0.743791788816452, + "num_tokens": 130182757.0, + "step": 56320 + }, + { + "epoch": 0.5164573209865224, + "learning_rate": 9.671036948748511e-05, + "loss": 0.8262, + "mean_token_accuracy": 0.7528278768062592, + "num_tokens": 130206495.0, + "step": 56330 + }, + { + "epoch": 0.5165490052260017, + "learning_rate": 9.669203263958926e-05, + "loss": 0.8291, + "mean_token_accuracy": 0.7492689609527587, + "num_tokens": 130229215.0, + "step": 56340 + }, + { + "epoch": 0.5166406894654809, + "learning_rate": 9.667369579169341e-05, + "loss": 0.8245, + "mean_token_accuracy": 0.7553637564182282, + "num_tokens": 130252431.0, + "step": 56350 + }, + { + "epoch": 0.5167323737049602, + "learning_rate": 9.665535894379757e-05, + "loss": 0.871, + "mean_token_accuracy": 0.7451859712600708, + "num_tokens": 130275970.0, + "step": 56360 + }, + { + "epoch": 0.5168240579444393, + "learning_rate": 9.663702209590172e-05, + "loss": 0.8074, + "mean_token_accuracy": 0.7540444791316986, + "num_tokens": 130299393.0, + "step": 56370 + }, + { + "epoch": 0.5169157421839186, + "learning_rate": 9.661868524800587e-05, + "loss": 0.8422, + "mean_token_accuracy": 0.7524396538734436, + "num_tokens": 130322460.0, + "step": 56380 + }, + { + "epoch": 0.5170074264233978, + "learning_rate": 9.660034840011003e-05, + "loss": 0.8684, + "mean_token_accuracy": 0.7433933138847351, + "num_tokens": 130345701.0, + "step": 56390 + }, + { + "epoch": 0.5170991106628771, + "learning_rate": 9.658201155221419e-05, + "loss": 0.8552, + "mean_token_accuracy": 0.7409780025482178, + "num_tokens": 130369050.0, + "step": 56400 + }, + { + "epoch": 0.5171907949023563, + "learning_rate": 9.656367470431832e-05, + "loss": 0.85, + "mean_token_accuracy": 0.7443040788173676, + "num_tokens": 130392154.0, + "step": 56410 + }, + { + "epoch": 0.5172824791418356, + "learning_rate": 9.654533785642249e-05, + "loss": 0.8315, + "mean_token_accuracy": 0.752303522825241, + "num_tokens": 130414408.0, + "step": 56420 + }, + { + "epoch": 0.5173741633813147, + "learning_rate": 9.652700100852664e-05, + "loss": 0.8612, + "mean_token_accuracy": 0.7437770307064057, + "num_tokens": 130436886.0, + "step": 56430 + }, + { + "epoch": 0.517465847620794, + "learning_rate": 9.65086641606308e-05, + "loss": 0.8502, + "mean_token_accuracy": 0.7493125796318054, + "num_tokens": 130459919.0, + "step": 56440 + }, + { + "epoch": 0.5175575318602732, + "learning_rate": 9.649032731273495e-05, + "loss": 0.8256, + "mean_token_accuracy": 0.7514883935451507, + "num_tokens": 130483189.0, + "step": 56450 + }, + { + "epoch": 0.5176492160997525, + "learning_rate": 9.64719904648391e-05, + "loss": 0.8247, + "mean_token_accuracy": 0.7569907665252685, + "num_tokens": 130505681.0, + "step": 56460 + }, + { + "epoch": 0.5177409003392317, + "learning_rate": 9.645365361694325e-05, + "loss": 0.7985, + "mean_token_accuracy": 0.7550045609474182, + "num_tokens": 130528841.0, + "step": 56470 + }, + { + "epoch": 0.517832584578711, + "learning_rate": 9.64353167690474e-05, + "loss": 0.8332, + "mean_token_accuracy": 0.7549361646175384, + "num_tokens": 130552409.0, + "step": 56480 + }, + { + "epoch": 0.5179242688181902, + "learning_rate": 9.641697992115157e-05, + "loss": 0.8145, + "mean_token_accuracy": 0.758808434009552, + "num_tokens": 130575061.0, + "step": 56490 + }, + { + "epoch": 0.5180159530576693, + "learning_rate": 9.639864307325572e-05, + "loss": 0.8206, + "mean_token_accuracy": 0.7493482887744903, + "num_tokens": 130598765.0, + "step": 56500 + }, + { + "epoch": 0.5181076372971486, + "learning_rate": 9.638030622535986e-05, + "loss": 0.8625, + "mean_token_accuracy": 0.7403877735137939, + "num_tokens": 130622746.0, + "step": 56510 + }, + { + "epoch": 0.5181993215366278, + "learning_rate": 9.636196937746402e-05, + "loss": 0.8264, + "mean_token_accuracy": 0.7492237091064453, + "num_tokens": 130645671.0, + "step": 56520 + }, + { + "epoch": 0.5182910057761071, + "learning_rate": 9.634363252956817e-05, + "loss": 0.8388, + "mean_token_accuracy": 0.7474077999591827, + "num_tokens": 130668535.0, + "step": 56530 + }, + { + "epoch": 0.5183826900155863, + "learning_rate": 9.632529568167233e-05, + "loss": 0.8397, + "mean_token_accuracy": 0.7496312081813812, + "num_tokens": 130691741.0, + "step": 56540 + }, + { + "epoch": 0.5184743742550656, + "learning_rate": 9.630695883377648e-05, + "loss": 0.8177, + "mean_token_accuracy": 0.7515130519866944, + "num_tokens": 130714872.0, + "step": 56550 + }, + { + "epoch": 0.5185660584945447, + "learning_rate": 9.628862198588063e-05, + "loss": 0.8172, + "mean_token_accuracy": 0.7503711342811584, + "num_tokens": 130737646.0, + "step": 56560 + }, + { + "epoch": 0.518657742734024, + "learning_rate": 9.627028513798478e-05, + "loss": 0.8013, + "mean_token_accuracy": 0.7572340548038483, + "num_tokens": 130760567.0, + "step": 56570 + }, + { + "epoch": 0.5187494269735032, + "learning_rate": 9.625194829008893e-05, + "loss": 0.8347, + "mean_token_accuracy": 0.7530829191207886, + "num_tokens": 130783564.0, + "step": 56580 + }, + { + "epoch": 0.5188411112129825, + "learning_rate": 9.62336114421931e-05, + "loss": 0.8625, + "mean_token_accuracy": 0.7468912541866303, + "num_tokens": 130806111.0, + "step": 56590 + }, + { + "epoch": 0.5189327954524617, + "learning_rate": 9.621527459429725e-05, + "loss": 0.8209, + "mean_token_accuracy": 0.7515967309474945, + "num_tokens": 130829362.0, + "step": 56600 + }, + { + "epoch": 0.519024479691941, + "learning_rate": 9.619693774640139e-05, + "loss": 0.8133, + "mean_token_accuracy": 0.7559102058410645, + "num_tokens": 130852671.0, + "step": 56610 + }, + { + "epoch": 0.5191161639314202, + "learning_rate": 9.617860089850555e-05, + "loss": 0.862, + "mean_token_accuracy": 0.7443732738494873, + "num_tokens": 130875717.0, + "step": 56620 + }, + { + "epoch": 0.5192078481708994, + "learning_rate": 9.61602640506097e-05, + "loss": 0.8813, + "mean_token_accuracy": 0.7381378471851349, + "num_tokens": 130898979.0, + "step": 56630 + }, + { + "epoch": 0.5192995324103786, + "learning_rate": 9.614192720271386e-05, + "loss": 0.8489, + "mean_token_accuracy": 0.742695790529251, + "num_tokens": 130922449.0, + "step": 56640 + }, + { + "epoch": 0.5193912166498579, + "learning_rate": 9.612359035481801e-05, + "loss": 0.8137, + "mean_token_accuracy": 0.7539062261581421, + "num_tokens": 130944965.0, + "step": 56650 + }, + { + "epoch": 0.5194829008893371, + "learning_rate": 9.610525350692216e-05, + "loss": 0.8681, + "mean_token_accuracy": 0.7439112007617951, + "num_tokens": 130968046.0, + "step": 56660 + }, + { + "epoch": 0.5195745851288164, + "learning_rate": 9.608691665902631e-05, + "loss": 0.8179, + "mean_token_accuracy": 0.7543026506900787, + "num_tokens": 130991273.0, + "step": 56670 + }, + { + "epoch": 0.5196662693682956, + "learning_rate": 9.606857981113047e-05, + "loss": 0.8213, + "mean_token_accuracy": 0.7530774056911469, + "num_tokens": 131015586.0, + "step": 56680 + }, + { + "epoch": 0.5197579536077748, + "learning_rate": 9.605024296323463e-05, + "loss": 0.8061, + "mean_token_accuracy": 0.7528681635856629, + "num_tokens": 131038648.0, + "step": 56690 + }, + { + "epoch": 0.519849637847254, + "learning_rate": 9.603190611533878e-05, + "loss": 0.8134, + "mean_token_accuracy": 0.7553314149379731, + "num_tokens": 131061932.0, + "step": 56700 + }, + { + "epoch": 0.5199413220867333, + "learning_rate": 9.601356926744292e-05, + "loss": 0.8223, + "mean_token_accuracy": 0.7534793615341187, + "num_tokens": 131084572.0, + "step": 56710 + }, + { + "epoch": 0.5200330063262125, + "learning_rate": 9.599523241954709e-05, + "loss": 0.8142, + "mean_token_accuracy": 0.7502929627895355, + "num_tokens": 131107331.0, + "step": 56720 + }, + { + "epoch": 0.5201246905656918, + "learning_rate": 9.597689557165124e-05, + "loss": 0.8519, + "mean_token_accuracy": 0.7471710503101349, + "num_tokens": 131130301.0, + "step": 56730 + }, + { + "epoch": 0.520216374805171, + "learning_rate": 9.595855872375539e-05, + "loss": 0.8415, + "mean_token_accuracy": 0.7527761101722718, + "num_tokens": 131153232.0, + "step": 56740 + }, + { + "epoch": 0.5203080590446503, + "learning_rate": 9.594022187585954e-05, + "loss": 0.811, + "mean_token_accuracy": 0.7562039017677307, + "num_tokens": 131176569.0, + "step": 56750 + }, + { + "epoch": 0.5203997432841294, + "learning_rate": 9.59218850279637e-05, + "loss": 0.8489, + "mean_token_accuracy": 0.7481797993183136, + "num_tokens": 131199560.0, + "step": 56760 + }, + { + "epoch": 0.5204914275236087, + "learning_rate": 9.590354818006785e-05, + "loss": 0.8292, + "mean_token_accuracy": 0.7534015774726868, + "num_tokens": 131222235.0, + "step": 56770 + }, + { + "epoch": 0.5205831117630879, + "learning_rate": 9.588521133217201e-05, + "loss": 0.7896, + "mean_token_accuracy": 0.761231142282486, + "num_tokens": 131244707.0, + "step": 56780 + }, + { + "epoch": 0.5206747960025672, + "learning_rate": 9.586687448427616e-05, + "loss": 0.8674, + "mean_token_accuracy": 0.7412490248680115, + "num_tokens": 131267957.0, + "step": 56790 + }, + { + "epoch": 0.5207664802420464, + "learning_rate": 9.584853763638032e-05, + "loss": 0.8433, + "mean_token_accuracy": 0.7470519006252289, + "num_tokens": 131290722.0, + "step": 56800 + }, + { + "epoch": 0.5208581644815257, + "learning_rate": 9.583020078848445e-05, + "loss": 0.8579, + "mean_token_accuracy": 0.7428442060947418, + "num_tokens": 131314094.0, + "step": 56810 + }, + { + "epoch": 0.5209498487210048, + "learning_rate": 9.581186394058862e-05, + "loss": 0.8172, + "mean_token_accuracy": 0.7486804187297821, + "num_tokens": 131337454.0, + "step": 56820 + }, + { + "epoch": 0.521041532960484, + "learning_rate": 9.579352709269277e-05, + "loss": 0.8326, + "mean_token_accuracy": 0.7509289622306824, + "num_tokens": 131360423.0, + "step": 56830 + }, + { + "epoch": 0.5211332171999633, + "learning_rate": 9.577519024479692e-05, + "loss": 0.8558, + "mean_token_accuracy": 0.743102389574051, + "num_tokens": 131383916.0, + "step": 56840 + }, + { + "epoch": 0.5212249014394426, + "learning_rate": 9.575685339690107e-05, + "loss": 0.8542, + "mean_token_accuracy": 0.7442952692508698, + "num_tokens": 131407662.0, + "step": 56850 + }, + { + "epoch": 0.5213165856789218, + "learning_rate": 9.573851654900523e-05, + "loss": 0.8257, + "mean_token_accuracy": 0.7501402974128724, + "num_tokens": 131430601.0, + "step": 56860 + }, + { + "epoch": 0.5214082699184011, + "learning_rate": 9.572017970110938e-05, + "loss": 0.8251, + "mean_token_accuracy": 0.7523505985736847, + "num_tokens": 131453829.0, + "step": 56870 + }, + { + "epoch": 0.5214999541578803, + "learning_rate": 9.570184285321354e-05, + "loss": 0.804, + "mean_token_accuracy": 0.7546593546867371, + "num_tokens": 131477027.0, + "step": 56880 + }, + { + "epoch": 0.5215916383973594, + "learning_rate": 9.56835060053177e-05, + "loss": 0.8258, + "mean_token_accuracy": 0.7541169285774231, + "num_tokens": 131500478.0, + "step": 56890 + }, + { + "epoch": 0.5216833226368387, + "learning_rate": 9.566516915742185e-05, + "loss": 0.8466, + "mean_token_accuracy": 0.7427525162696839, + "num_tokens": 131523953.0, + "step": 56900 + }, + { + "epoch": 0.521775006876318, + "learning_rate": 9.5646832309526e-05, + "loss": 0.8428, + "mean_token_accuracy": 0.742903733253479, + "num_tokens": 131547167.0, + "step": 56910 + }, + { + "epoch": 0.5218666911157972, + "learning_rate": 9.562849546163015e-05, + "loss": 0.8455, + "mean_token_accuracy": 0.7451618432998657, + "num_tokens": 131570197.0, + "step": 56920 + }, + { + "epoch": 0.5219583753552764, + "learning_rate": 9.56101586137343e-05, + "loss": 0.8208, + "mean_token_accuracy": 0.7520460546016693, + "num_tokens": 131594129.0, + "step": 56930 + }, + { + "epoch": 0.5220500595947557, + "learning_rate": 9.559182176583846e-05, + "loss": 0.8475, + "mean_token_accuracy": 0.7443790912628174, + "num_tokens": 131616888.0, + "step": 56940 + }, + { + "epoch": 0.522141743834235, + "learning_rate": 9.557348491794261e-05, + "loss": 0.8314, + "mean_token_accuracy": 0.7462843596935272, + "num_tokens": 131639627.0, + "step": 56950 + }, + { + "epoch": 0.5222334280737141, + "learning_rate": 9.555514807004676e-05, + "loss": 0.8737, + "mean_token_accuracy": 0.7411675214767456, + "num_tokens": 131662072.0, + "step": 56960 + }, + { + "epoch": 0.5223251123131933, + "learning_rate": 9.553681122215091e-05, + "loss": 0.851, + "mean_token_accuracy": 0.745289546251297, + "num_tokens": 131685280.0, + "step": 56970 + }, + { + "epoch": 0.5224167965526726, + "learning_rate": 9.551847437425508e-05, + "loss": 0.8357, + "mean_token_accuracy": 0.7507482826709747, + "num_tokens": 131708358.0, + "step": 56980 + }, + { + "epoch": 0.5225084807921518, + "learning_rate": 9.550013752635923e-05, + "loss": 0.8474, + "mean_token_accuracy": 0.7514139413833618, + "num_tokens": 131732494.0, + "step": 56990 + }, + { + "epoch": 0.5226001650316311, + "learning_rate": 9.548180067846338e-05, + "loss": 0.8186, + "mean_token_accuracy": 0.7497166395187378, + "num_tokens": 131755048.0, + "step": 57000 + }, + { + "epoch": 0.5226918492711103, + "learning_rate": 9.546346383056753e-05, + "loss": 0.8433, + "mean_token_accuracy": 0.7481898128986358, + "num_tokens": 131778522.0, + "step": 57010 + }, + { + "epoch": 0.5227835335105895, + "learning_rate": 9.544512698267168e-05, + "loss": 0.8311, + "mean_token_accuracy": 0.7491007447242737, + "num_tokens": 131801658.0, + "step": 57020 + }, + { + "epoch": 0.5228752177500687, + "learning_rate": 9.542679013477584e-05, + "loss": 0.8458, + "mean_token_accuracy": 0.7505529463291168, + "num_tokens": 131824486.0, + "step": 57030 + }, + { + "epoch": 0.522966901989548, + "learning_rate": 9.540845328688e-05, + "loss": 0.7944, + "mean_token_accuracy": 0.7576842725276947, + "num_tokens": 131847717.0, + "step": 57040 + }, + { + "epoch": 0.5230585862290272, + "learning_rate": 9.539011643898414e-05, + "loss": 0.8911, + "mean_token_accuracy": 0.7397165119647979, + "num_tokens": 131871073.0, + "step": 57050 + }, + { + "epoch": 0.5231502704685065, + "learning_rate": 9.537177959108829e-05, + "loss": 0.8399, + "mean_token_accuracy": 0.7458792924880981, + "num_tokens": 131893726.0, + "step": 57060 + }, + { + "epoch": 0.5232419547079857, + "learning_rate": 9.535344274319244e-05, + "loss": 0.8409, + "mean_token_accuracy": 0.7471013247966767, + "num_tokens": 131917471.0, + "step": 57070 + }, + { + "epoch": 0.523333638947465, + "learning_rate": 9.533510589529661e-05, + "loss": 0.8717, + "mean_token_accuracy": 0.7374906480312348, + "num_tokens": 131940815.0, + "step": 57080 + }, + { + "epoch": 0.5234253231869441, + "learning_rate": 9.531676904740076e-05, + "loss": 0.8446, + "mean_token_accuracy": 0.7464725852012635, + "num_tokens": 131964724.0, + "step": 57090 + }, + { + "epoch": 0.5235170074264234, + "learning_rate": 9.529843219950491e-05, + "loss": 0.8448, + "mean_token_accuracy": 0.741492235660553, + "num_tokens": 131987976.0, + "step": 57100 + }, + { + "epoch": 0.5236086916659026, + "learning_rate": 9.528009535160906e-05, + "loss": 0.8083, + "mean_token_accuracy": 0.758763724565506, + "num_tokens": 132011836.0, + "step": 57110 + }, + { + "epoch": 0.5237003759053819, + "learning_rate": 9.526175850371322e-05, + "loss": 0.8292, + "mean_token_accuracy": 0.7485464990139008, + "num_tokens": 132034853.0, + "step": 57120 + }, + { + "epoch": 0.5237920601448611, + "learning_rate": 9.524342165581737e-05, + "loss": 0.8593, + "mean_token_accuracy": 0.7454329550266265, + "num_tokens": 132058644.0, + "step": 57130 + }, + { + "epoch": 0.5238837443843404, + "learning_rate": 9.522508480792153e-05, + "loss": 0.8604, + "mean_token_accuracy": 0.7422268509864807, + "num_tokens": 132081896.0, + "step": 57140 + }, + { + "epoch": 0.5239754286238195, + "learning_rate": 9.520674796002567e-05, + "loss": 0.8561, + "mean_token_accuracy": 0.7491759121417999, + "num_tokens": 132105666.0, + "step": 57150 + }, + { + "epoch": 0.5240671128632988, + "learning_rate": 9.518841111212982e-05, + "loss": 0.8618, + "mean_token_accuracy": 0.7442149877548218, + "num_tokens": 132128795.0, + "step": 57160 + }, + { + "epoch": 0.524158797102778, + "learning_rate": 9.517007426423399e-05, + "loss": 0.8123, + "mean_token_accuracy": 0.7535880506038666, + "num_tokens": 132152913.0, + "step": 57170 + }, + { + "epoch": 0.5242504813422573, + "learning_rate": 9.515173741633814e-05, + "loss": 0.8256, + "mean_token_accuracy": 0.7542143046855927, + "num_tokens": 132176758.0, + "step": 57180 + }, + { + "epoch": 0.5243421655817365, + "learning_rate": 9.513340056844229e-05, + "loss": 0.8217, + "mean_token_accuracy": 0.7579224288463593, + "num_tokens": 132199520.0, + "step": 57190 + }, + { + "epoch": 0.5244338498212158, + "learning_rate": 9.511506372054644e-05, + "loss": 0.8376, + "mean_token_accuracy": 0.7474627912044525, + "num_tokens": 132223405.0, + "step": 57200 + }, + { + "epoch": 0.524525534060695, + "learning_rate": 9.50967268726506e-05, + "loss": 0.8274, + "mean_token_accuracy": 0.7523048102855683, + "num_tokens": 132246499.0, + "step": 57210 + }, + { + "epoch": 0.5246172183001742, + "learning_rate": 9.507839002475475e-05, + "loss": 0.8278, + "mean_token_accuracy": 0.7563997805118561, + "num_tokens": 132270309.0, + "step": 57220 + }, + { + "epoch": 0.5247089025396534, + "learning_rate": 9.50600531768589e-05, + "loss": 0.812, + "mean_token_accuracy": 0.7527232706546784, + "num_tokens": 132293903.0, + "step": 57230 + }, + { + "epoch": 0.5248005867791327, + "learning_rate": 9.504171632896307e-05, + "loss": 0.8095, + "mean_token_accuracy": 0.7493672370910645, + "num_tokens": 132317030.0, + "step": 57240 + }, + { + "epoch": 0.5248922710186119, + "learning_rate": 9.50233794810672e-05, + "loss": 0.8288, + "mean_token_accuracy": 0.7502146303653717, + "num_tokens": 132340928.0, + "step": 57250 + }, + { + "epoch": 0.5249839552580912, + "learning_rate": 9.500504263317136e-05, + "loss": 0.8286, + "mean_token_accuracy": 0.7479620635509491, + "num_tokens": 132364758.0, + "step": 57260 + }, + { + "epoch": 0.5250756394975704, + "learning_rate": 9.498670578527552e-05, + "loss": 0.873, + "mean_token_accuracy": 0.7462909758090973, + "num_tokens": 132388386.0, + "step": 57270 + }, + { + "epoch": 0.5251673237370496, + "learning_rate": 9.496836893737967e-05, + "loss": 0.8087, + "mean_token_accuracy": 0.7573596954345703, + "num_tokens": 132412261.0, + "step": 57280 + }, + { + "epoch": 0.5252590079765288, + "learning_rate": 9.495003208948382e-05, + "loss": 0.8446, + "mean_token_accuracy": 0.7508314967155456, + "num_tokens": 132435035.0, + "step": 57290 + }, + { + "epoch": 0.525350692216008, + "learning_rate": 9.493169524158798e-05, + "loss": 0.8335, + "mean_token_accuracy": 0.7515981912612915, + "num_tokens": 132458573.0, + "step": 57300 + }, + { + "epoch": 0.5254423764554873, + "learning_rate": 9.491335839369213e-05, + "loss": 0.8131, + "mean_token_accuracy": 0.7545001804828644, + "num_tokens": 132481783.0, + "step": 57310 + }, + { + "epoch": 0.5255340606949666, + "learning_rate": 9.489502154579628e-05, + "loss": 0.8037, + "mean_token_accuracy": 0.756865781545639, + "num_tokens": 132505196.0, + "step": 57320 + }, + { + "epoch": 0.5256257449344458, + "learning_rate": 9.487668469790043e-05, + "loss": 0.8196, + "mean_token_accuracy": 0.7529776632785797, + "num_tokens": 132529169.0, + "step": 57330 + }, + { + "epoch": 0.525717429173925, + "learning_rate": 9.48583478500046e-05, + "loss": 0.8247, + "mean_token_accuracy": 0.7593657732009887, + "num_tokens": 132552626.0, + "step": 57340 + }, + { + "epoch": 0.5258091134134042, + "learning_rate": 9.484001100210874e-05, + "loss": 0.8315, + "mean_token_accuracy": 0.7545748353004456, + "num_tokens": 132576850.0, + "step": 57350 + }, + { + "epoch": 0.5259007976528834, + "learning_rate": 9.482167415421289e-05, + "loss": 0.7969, + "mean_token_accuracy": 0.7564575612545014, + "num_tokens": 132601601.0, + "step": 57360 + }, + { + "epoch": 0.5259924818923627, + "learning_rate": 9.480333730631705e-05, + "loss": 0.8186, + "mean_token_accuracy": 0.7548130989074707, + "num_tokens": 132625568.0, + "step": 57370 + }, + { + "epoch": 0.526084166131842, + "learning_rate": 9.47850004584212e-05, + "loss": 0.8422, + "mean_token_accuracy": 0.7476212620735169, + "num_tokens": 132649507.0, + "step": 57380 + }, + { + "epoch": 0.5261758503713212, + "learning_rate": 9.476666361052536e-05, + "loss": 0.8363, + "mean_token_accuracy": 0.7549296379089355, + "num_tokens": 132672725.0, + "step": 57390 + }, + { + "epoch": 0.5262675346108004, + "learning_rate": 9.474832676262951e-05, + "loss": 0.8237, + "mean_token_accuracy": 0.7542741537094116, + "num_tokens": 132696060.0, + "step": 57400 + }, + { + "epoch": 0.5263592188502796, + "learning_rate": 9.472998991473366e-05, + "loss": 0.8367, + "mean_token_accuracy": 0.7523957431316376, + "num_tokens": 132719765.0, + "step": 57410 + }, + { + "epoch": 0.5264509030897588, + "learning_rate": 9.471165306683781e-05, + "loss": 0.8058, + "mean_token_accuracy": 0.755360621213913, + "num_tokens": 132743859.0, + "step": 57420 + }, + { + "epoch": 0.5265425873292381, + "learning_rate": 9.469331621894196e-05, + "loss": 0.8484, + "mean_token_accuracy": 0.7548549771308899, + "num_tokens": 132766432.0, + "step": 57430 + }, + { + "epoch": 0.5266342715687173, + "learning_rate": 9.467497937104613e-05, + "loss": 0.8446, + "mean_token_accuracy": 0.7448384761810303, + "num_tokens": 132789432.0, + "step": 57440 + }, + { + "epoch": 0.5267259558081966, + "learning_rate": 9.465664252315027e-05, + "loss": 0.7871, + "mean_token_accuracy": 0.7622412264347076, + "num_tokens": 132813301.0, + "step": 57450 + }, + { + "epoch": 0.5268176400476758, + "learning_rate": 9.463830567525442e-05, + "loss": 0.8309, + "mean_token_accuracy": 0.750828206539154, + "num_tokens": 132836450.0, + "step": 57460 + }, + { + "epoch": 0.5269093242871551, + "learning_rate": 9.461996882735859e-05, + "loss": 0.8423, + "mean_token_accuracy": 0.7530226111412048, + "num_tokens": 132859850.0, + "step": 57470 + }, + { + "epoch": 0.5270010085266342, + "learning_rate": 9.460163197946274e-05, + "loss": 0.8388, + "mean_token_accuracy": 0.7607247173786164, + "num_tokens": 132883759.0, + "step": 57480 + }, + { + "epoch": 0.5270926927661135, + "learning_rate": 9.458329513156689e-05, + "loss": 0.8297, + "mean_token_accuracy": 0.752485191822052, + "num_tokens": 132907839.0, + "step": 57490 + }, + { + "epoch": 0.5271843770055927, + "learning_rate": 9.456495828367104e-05, + "loss": 0.8071, + "mean_token_accuracy": 0.7524581611156463, + "num_tokens": 132931824.0, + "step": 57500 + }, + { + "epoch": 0.527276061245072, + "learning_rate": 9.454662143577519e-05, + "loss": 0.8011, + "mean_token_accuracy": 0.7583715319633484, + "num_tokens": 132955307.0, + "step": 57510 + }, + { + "epoch": 0.5273677454845512, + "learning_rate": 9.452828458787934e-05, + "loss": 0.8086, + "mean_token_accuracy": 0.7547164380550384, + "num_tokens": 132978556.0, + "step": 57520 + }, + { + "epoch": 0.5274594297240305, + "learning_rate": 9.450994773998351e-05, + "loss": 0.8672, + "mean_token_accuracy": 0.7438210904598236, + "num_tokens": 133001261.0, + "step": 57530 + }, + { + "epoch": 0.5275511139635096, + "learning_rate": 9.449161089208766e-05, + "loss": 0.8208, + "mean_token_accuracy": 0.7512878775596619, + "num_tokens": 133025584.0, + "step": 57540 + }, + { + "epoch": 0.5276427982029889, + "learning_rate": 9.44732740441918e-05, + "loss": 0.8079, + "mean_token_accuracy": 0.7574107646942139, + "num_tokens": 133048385.0, + "step": 57550 + }, + { + "epoch": 0.5277344824424681, + "learning_rate": 9.445493719629595e-05, + "loss": 0.8154, + "mean_token_accuracy": 0.7554541051387786, + "num_tokens": 133072294.0, + "step": 57560 + }, + { + "epoch": 0.5278261666819474, + "learning_rate": 9.443660034840012e-05, + "loss": 0.7628, + "mean_token_accuracy": 0.7651211798191071, + "num_tokens": 133095880.0, + "step": 57570 + }, + { + "epoch": 0.5279178509214266, + "learning_rate": 9.441826350050427e-05, + "loss": 0.8231, + "mean_token_accuracy": 0.7492182612419128, + "num_tokens": 133120385.0, + "step": 57580 + }, + { + "epoch": 0.5280095351609059, + "learning_rate": 9.439992665260842e-05, + "loss": 0.7875, + "mean_token_accuracy": 0.7622422754764557, + "num_tokens": 133144058.0, + "step": 57590 + }, + { + "epoch": 0.5281012194003851, + "learning_rate": 9.438158980471257e-05, + "loss": 0.7835, + "mean_token_accuracy": 0.7637467741966247, + "num_tokens": 133167657.0, + "step": 57600 + }, + { + "epoch": 0.5281929036398643, + "learning_rate": 9.436325295681673e-05, + "loss": 0.8643, + "mean_token_accuracy": 0.7401656031608581, + "num_tokens": 133192252.0, + "step": 57610 + }, + { + "epoch": 0.5282845878793435, + "learning_rate": 9.434491610892088e-05, + "loss": 0.8026, + "mean_token_accuracy": 0.756588363647461, + "num_tokens": 133216402.0, + "step": 57620 + }, + { + "epoch": 0.5283762721188228, + "learning_rate": 9.432657926102504e-05, + "loss": 0.7983, + "mean_token_accuracy": 0.763013631105423, + "num_tokens": 133239776.0, + "step": 57630 + }, + { + "epoch": 0.528467956358302, + "learning_rate": 9.43082424131292e-05, + "loss": 0.8524, + "mean_token_accuracy": 0.7439938604831695, + "num_tokens": 133262456.0, + "step": 57640 + }, + { + "epoch": 0.5285596405977813, + "learning_rate": 9.428990556523333e-05, + "loss": 0.7994, + "mean_token_accuracy": 0.7561735332012176, + "num_tokens": 133285602.0, + "step": 57650 + }, + { + "epoch": 0.5286513248372605, + "learning_rate": 9.42715687173375e-05, + "loss": 0.7467, + "mean_token_accuracy": 0.7689444124698639, + "num_tokens": 133309649.0, + "step": 57660 + }, + { + "epoch": 0.5287430090767397, + "learning_rate": 9.425323186944165e-05, + "loss": 0.7982, + "mean_token_accuracy": 0.7575224041938782, + "num_tokens": 133333004.0, + "step": 57670 + }, + { + "epoch": 0.5288346933162189, + "learning_rate": 9.42348950215458e-05, + "loss": 0.8724, + "mean_token_accuracy": 0.7395725250244141, + "num_tokens": 133356516.0, + "step": 57680 + }, + { + "epoch": 0.5289263775556982, + "learning_rate": 9.421655817364995e-05, + "loss": 0.8069, + "mean_token_accuracy": 0.7581106424331665, + "num_tokens": 133381215.0, + "step": 57690 + }, + { + "epoch": 0.5290180617951774, + "learning_rate": 9.41982213257541e-05, + "loss": 0.805, + "mean_token_accuracy": 0.7568289577960968, + "num_tokens": 133405564.0, + "step": 57700 + }, + { + "epoch": 0.5291097460346567, + "learning_rate": 9.417988447785826e-05, + "loss": 0.8248, + "mean_token_accuracy": 0.7545980334281921, + "num_tokens": 133427933.0, + "step": 57710 + }, + { + "epoch": 0.5292014302741359, + "learning_rate": 9.416154762996241e-05, + "loss": 0.8056, + "mean_token_accuracy": 0.7599722623825074, + "num_tokens": 133451518.0, + "step": 57720 + }, + { + "epoch": 0.5292931145136152, + "learning_rate": 9.414321078206657e-05, + "loss": 0.8205, + "mean_token_accuracy": 0.7493108093738556, + "num_tokens": 133475683.0, + "step": 57730 + }, + { + "epoch": 0.5293847987530943, + "learning_rate": 9.412487393417073e-05, + "loss": 0.7904, + "mean_token_accuracy": 0.7551456451416015, + "num_tokens": 133498559.0, + "step": 57740 + }, + { + "epoch": 0.5294764829925735, + "learning_rate": 9.410653708627486e-05, + "loss": 0.7369, + "mean_token_accuracy": 0.7759769082069397, + "num_tokens": 133522020.0, + "step": 57750 + }, + { + "epoch": 0.5295681672320528, + "learning_rate": 9.408820023837903e-05, + "loss": 0.7993, + "mean_token_accuracy": 0.7615691244602203, + "num_tokens": 133545112.0, + "step": 57760 + }, + { + "epoch": 0.529659851471532, + "learning_rate": 9.406986339048318e-05, + "loss": 0.8141, + "mean_token_accuracy": 0.7508325040340423, + "num_tokens": 133569653.0, + "step": 57770 + }, + { + "epoch": 0.5297515357110113, + "learning_rate": 9.405152654258733e-05, + "loss": 0.7997, + "mean_token_accuracy": 0.7645523369312286, + "num_tokens": 133593225.0, + "step": 57780 + }, + { + "epoch": 0.5298432199504906, + "learning_rate": 9.403318969469149e-05, + "loss": 0.8089, + "mean_token_accuracy": 0.7540140330791474, + "num_tokens": 133617163.0, + "step": 57790 + }, + { + "epoch": 0.5299349041899697, + "learning_rate": 9.401485284679564e-05, + "loss": 0.8069, + "mean_token_accuracy": 0.756240439414978, + "num_tokens": 133641186.0, + "step": 57800 + }, + { + "epoch": 0.5300265884294489, + "learning_rate": 9.399651599889979e-05, + "loss": 0.798, + "mean_token_accuracy": 0.7593181669712067, + "num_tokens": 133664755.0, + "step": 57810 + }, + { + "epoch": 0.5301182726689282, + "learning_rate": 9.397817915100394e-05, + "loss": 0.789, + "mean_token_accuracy": 0.7571062684059143, + "num_tokens": 133688104.0, + "step": 57820 + }, + { + "epoch": 0.5302099569084074, + "learning_rate": 9.395984230310811e-05, + "loss": 0.8109, + "mean_token_accuracy": 0.7545394539833069, + "num_tokens": 133712739.0, + "step": 57830 + }, + { + "epoch": 0.5303016411478867, + "learning_rate": 9.394150545521226e-05, + "loss": 0.7615, + "mean_token_accuracy": 0.7724260568618775, + "num_tokens": 133737768.0, + "step": 57840 + }, + { + "epoch": 0.5303933253873659, + "learning_rate": 9.39231686073164e-05, + "loss": 0.7798, + "mean_token_accuracy": 0.7640564382076264, + "num_tokens": 133761290.0, + "step": 57850 + }, + { + "epoch": 0.5304850096268452, + "learning_rate": 9.390483175942056e-05, + "loss": 0.7987, + "mean_token_accuracy": 0.757305258512497, + "num_tokens": 133785048.0, + "step": 57860 + }, + { + "epoch": 0.5305766938663243, + "learning_rate": 9.388649491152471e-05, + "loss": 0.7756, + "mean_token_accuracy": 0.7601220607757568, + "num_tokens": 133808910.0, + "step": 57870 + }, + { + "epoch": 0.5306683781058036, + "learning_rate": 9.386815806362887e-05, + "loss": 0.7884, + "mean_token_accuracy": 0.76932772397995, + "num_tokens": 133832965.0, + "step": 57880 + }, + { + "epoch": 0.5307600623452828, + "learning_rate": 9.384982121573302e-05, + "loss": 0.8328, + "mean_token_accuracy": 0.7507218062877655, + "num_tokens": 133856049.0, + "step": 57890 + }, + { + "epoch": 0.5308517465847621, + "learning_rate": 9.383148436783717e-05, + "loss": 0.7905, + "mean_token_accuracy": 0.7680697858333587, + "num_tokens": 133880539.0, + "step": 57900 + }, + { + "epoch": 0.5309434308242413, + "learning_rate": 9.381314751994132e-05, + "loss": 0.792, + "mean_token_accuracy": 0.7629115223884583, + "num_tokens": 133904651.0, + "step": 57910 + }, + { + "epoch": 0.5310351150637206, + "learning_rate": 9.379481067204547e-05, + "loss": 0.828, + "mean_token_accuracy": 0.7504708647727967, + "num_tokens": 133928674.0, + "step": 57920 + }, + { + "epoch": 0.5311267993031997, + "learning_rate": 9.377647382414964e-05, + "loss": 0.7775, + "mean_token_accuracy": 0.7598287761211395, + "num_tokens": 133952675.0, + "step": 57930 + }, + { + "epoch": 0.531218483542679, + "learning_rate": 9.375813697625379e-05, + "loss": 0.7971, + "mean_token_accuracy": 0.7638172924518585, + "num_tokens": 133976567.0, + "step": 57940 + }, + { + "epoch": 0.5313101677821582, + "learning_rate": 9.373980012835793e-05, + "loss": 0.7929, + "mean_token_accuracy": 0.7637137115001679, + "num_tokens": 134000416.0, + "step": 57950 + }, + { + "epoch": 0.5314018520216375, + "learning_rate": 9.37214632804621e-05, + "loss": 0.8031, + "mean_token_accuracy": 0.7616167545318604, + "num_tokens": 134024444.0, + "step": 57960 + }, + { + "epoch": 0.5314935362611167, + "learning_rate": 9.370312643256625e-05, + "loss": 0.8212, + "mean_token_accuracy": 0.749068558216095, + "num_tokens": 134047944.0, + "step": 57970 + }, + { + "epoch": 0.531585220500596, + "learning_rate": 9.36847895846704e-05, + "loss": 0.8304, + "mean_token_accuracy": 0.752483582496643, + "num_tokens": 134071264.0, + "step": 57980 + }, + { + "epoch": 0.5316769047400752, + "learning_rate": 9.366645273677455e-05, + "loss": 0.7875, + "mean_token_accuracy": 0.7603633165359497, + "num_tokens": 134095233.0, + "step": 57990 + }, + { + "epoch": 0.5317685889795544, + "learning_rate": 9.36481158888787e-05, + "loss": 0.8491, + "mean_token_accuracy": 0.7498716950416565, + "num_tokens": 134119169.0, + "step": 58000 + }, + { + "epoch": 0.5318602732190336, + "learning_rate": 9.362977904098285e-05, + "loss": 0.8036, + "mean_token_accuracy": 0.7566041052341461, + "num_tokens": 134142485.0, + "step": 58010 + }, + { + "epoch": 0.5319519574585129, + "learning_rate": 9.361144219308702e-05, + "loss": 0.7884, + "mean_token_accuracy": 0.7657165229320526, + "num_tokens": 134167175.0, + "step": 58020 + }, + { + "epoch": 0.5320436416979921, + "learning_rate": 9.359310534519117e-05, + "loss": 0.7991, + "mean_token_accuracy": 0.7578857183456421, + "num_tokens": 134190810.0, + "step": 58030 + }, + { + "epoch": 0.5321353259374714, + "learning_rate": 9.357476849729532e-05, + "loss": 0.7823, + "mean_token_accuracy": 0.7648557901382447, + "num_tokens": 134215342.0, + "step": 58040 + }, + { + "epoch": 0.5322270101769506, + "learning_rate": 9.355643164939946e-05, + "loss": 0.8028, + "mean_token_accuracy": 0.7602374613285064, + "num_tokens": 134239388.0, + "step": 58050 + }, + { + "epoch": 0.5323186944164298, + "learning_rate": 9.353809480150363e-05, + "loss": 0.7839, + "mean_token_accuracy": 0.7690163731575013, + "num_tokens": 134262982.0, + "step": 58060 + }, + { + "epoch": 0.532410378655909, + "learning_rate": 9.351975795360778e-05, + "loss": 0.829, + "mean_token_accuracy": 0.7536212086677552, + "num_tokens": 134287338.0, + "step": 58070 + }, + { + "epoch": 0.5325020628953883, + "learning_rate": 9.350142110571193e-05, + "loss": 0.7853, + "mean_token_accuracy": 0.7642540335655212, + "num_tokens": 134311080.0, + "step": 58080 + }, + { + "epoch": 0.5325937471348675, + "learning_rate": 9.348308425781608e-05, + "loss": 0.7322, + "mean_token_accuracy": 0.769903838634491, + "num_tokens": 134334833.0, + "step": 58090 + }, + { + "epoch": 0.5326854313743468, + "learning_rate": 9.346474740992023e-05, + "loss": 0.846, + "mean_token_accuracy": 0.7454536139965058, + "num_tokens": 134358283.0, + "step": 58100 + }, + { + "epoch": 0.532777115613826, + "learning_rate": 9.344641056202439e-05, + "loss": 0.8399, + "mean_token_accuracy": 0.7469364881515503, + "num_tokens": 134381677.0, + "step": 58110 + }, + { + "epoch": 0.5328687998533053, + "learning_rate": 9.342807371412855e-05, + "loss": 0.7936, + "mean_token_accuracy": 0.7565255045890809, + "num_tokens": 134405319.0, + "step": 58120 + }, + { + "epoch": 0.5329604840927844, + "learning_rate": 9.34097368662327e-05, + "loss": 0.8292, + "mean_token_accuracy": 0.7440931677818299, + "num_tokens": 134429221.0, + "step": 58130 + }, + { + "epoch": 0.5330521683322637, + "learning_rate": 9.339140001833686e-05, + "loss": 0.7597, + "mean_token_accuracy": 0.7703822612762451, + "num_tokens": 134454037.0, + "step": 58140 + }, + { + "epoch": 0.5331438525717429, + "learning_rate": 9.337306317044101e-05, + "loss": 0.7616, + "mean_token_accuracy": 0.7670372784137726, + "num_tokens": 134478373.0, + "step": 58150 + }, + { + "epoch": 0.5332355368112222, + "learning_rate": 9.335472632254516e-05, + "loss": 0.7634, + "mean_token_accuracy": 0.7652393400669097, + "num_tokens": 134502345.0, + "step": 58160 + }, + { + "epoch": 0.5333272210507014, + "learning_rate": 9.333638947464931e-05, + "loss": 0.8045, + "mean_token_accuracy": 0.7603592276573181, + "num_tokens": 134526756.0, + "step": 58170 + }, + { + "epoch": 0.5334189052901807, + "learning_rate": 9.331805262675346e-05, + "loss": 0.7985, + "mean_token_accuracy": 0.7629460453987121, + "num_tokens": 134551619.0, + "step": 58180 + }, + { + "epoch": 0.5335105895296599, + "learning_rate": 9.329971577885761e-05, + "loss": 0.7833, + "mean_token_accuracy": 0.7612346410751343, + "num_tokens": 134575385.0, + "step": 58190 + }, + { + "epoch": 0.533602273769139, + "learning_rate": 9.328137893096177e-05, + "loss": 0.7858, + "mean_token_accuracy": 0.766508835554123, + "num_tokens": 134599990.0, + "step": 58200 + }, + { + "epoch": 0.5336939580086183, + "learning_rate": 9.326304208306592e-05, + "loss": 0.7578, + "mean_token_accuracy": 0.7712429940700531, + "num_tokens": 134623671.0, + "step": 58210 + }, + { + "epoch": 0.5337856422480975, + "learning_rate": 9.324470523517008e-05, + "loss": 0.8112, + "mean_token_accuracy": 0.7547142028808593, + "num_tokens": 134647528.0, + "step": 58220 + }, + { + "epoch": 0.5338773264875768, + "learning_rate": 9.322636838727424e-05, + "loss": 0.7885, + "mean_token_accuracy": 0.7550437688827515, + "num_tokens": 134671590.0, + "step": 58230 + }, + { + "epoch": 0.533969010727056, + "learning_rate": 9.320803153937839e-05, + "loss": 0.833, + "mean_token_accuracy": 0.7531205773353576, + "num_tokens": 134694681.0, + "step": 58240 + }, + { + "epoch": 0.5340606949665353, + "learning_rate": 9.318969469148254e-05, + "loss": 0.8013, + "mean_token_accuracy": 0.7594623863697052, + "num_tokens": 134718792.0, + "step": 58250 + }, + { + "epoch": 0.5341523792060144, + "learning_rate": 9.317135784358669e-05, + "loss": 0.7745, + "mean_token_accuracy": 0.7689113557338715, + "num_tokens": 134742825.0, + "step": 58260 + }, + { + "epoch": 0.5342440634454937, + "learning_rate": 9.315302099569084e-05, + "loss": 0.8206, + "mean_token_accuracy": 0.7558790862560272, + "num_tokens": 134765833.0, + "step": 58270 + }, + { + "epoch": 0.5343357476849729, + "learning_rate": 9.313468414779501e-05, + "loss": 0.8419, + "mean_token_accuracy": 0.7577371656894684, + "num_tokens": 134789050.0, + "step": 58280 + }, + { + "epoch": 0.5344274319244522, + "learning_rate": 9.311634729989915e-05, + "loss": 0.7838, + "mean_token_accuracy": 0.7634777903556824, + "num_tokens": 134813759.0, + "step": 58290 + }, + { + "epoch": 0.5345191161639314, + "learning_rate": 9.30980104520033e-05, + "loss": 0.8025, + "mean_token_accuracy": 0.7581336975097657, + "num_tokens": 134836989.0, + "step": 58300 + }, + { + "epoch": 0.5346108004034107, + "learning_rate": 9.307967360410745e-05, + "loss": 0.817, + "mean_token_accuracy": 0.7554428398609161, + "num_tokens": 134860209.0, + "step": 58310 + }, + { + "epoch": 0.5347024846428899, + "learning_rate": 9.306133675621162e-05, + "loss": 0.7948, + "mean_token_accuracy": 0.7627366423606873, + "num_tokens": 134884291.0, + "step": 58320 + }, + { + "epoch": 0.5347941688823691, + "learning_rate": 9.304299990831577e-05, + "loss": 0.8063, + "mean_token_accuracy": 0.7612611770629882, + "num_tokens": 134908434.0, + "step": 58330 + }, + { + "epoch": 0.5348858531218483, + "learning_rate": 9.302466306041992e-05, + "loss": 0.792, + "mean_token_accuracy": 0.7629269242286683, + "num_tokens": 134931790.0, + "step": 58340 + }, + { + "epoch": 0.5349775373613276, + "learning_rate": 9.300632621252407e-05, + "loss": 0.8017, + "mean_token_accuracy": 0.7589909791946411, + "num_tokens": 134955206.0, + "step": 58350 + }, + { + "epoch": 0.5350692216008068, + "learning_rate": 9.298798936462822e-05, + "loss": 0.7313, + "mean_token_accuracy": 0.7748064637184143, + "num_tokens": 134978977.0, + "step": 58360 + }, + { + "epoch": 0.5351609058402861, + "learning_rate": 9.296965251673238e-05, + "loss": 0.775, + "mean_token_accuracy": 0.7637354612350464, + "num_tokens": 135003333.0, + "step": 58370 + }, + { + "epoch": 0.5352525900797653, + "learning_rate": 9.295131566883654e-05, + "loss": 0.8168, + "mean_token_accuracy": 0.7580026090145111, + "num_tokens": 135026926.0, + "step": 58380 + }, + { + "epoch": 0.5353442743192445, + "learning_rate": 9.293297882094068e-05, + "loss": 0.7187, + "mean_token_accuracy": 0.774970269203186, + "num_tokens": 135050773.0, + "step": 58390 + }, + { + "epoch": 0.5354359585587237, + "learning_rate": 9.291464197304483e-05, + "loss": 0.784, + "mean_token_accuracy": 0.7690203487873077, + "num_tokens": 135074446.0, + "step": 58400 + }, + { + "epoch": 0.535527642798203, + "learning_rate": 9.2896305125149e-05, + "loss": 0.7838, + "mean_token_accuracy": 0.7571030974388122, + "num_tokens": 135098895.0, + "step": 58410 + }, + { + "epoch": 0.5356193270376822, + "learning_rate": 9.287796827725315e-05, + "loss": 0.7929, + "mean_token_accuracy": 0.7633040070533752, + "num_tokens": 135122402.0, + "step": 58420 + }, + { + "epoch": 0.5357110112771615, + "learning_rate": 9.28596314293573e-05, + "loss": 0.7882, + "mean_token_accuracy": 0.7635120272636413, + "num_tokens": 135145957.0, + "step": 58430 + }, + { + "epoch": 0.5358026955166407, + "learning_rate": 9.284129458146145e-05, + "loss": 0.7675, + "mean_token_accuracy": 0.7690262854099273, + "num_tokens": 135170375.0, + "step": 58440 + }, + { + "epoch": 0.53589437975612, + "learning_rate": 9.28229577335656e-05, + "loss": 0.7844, + "mean_token_accuracy": 0.7598381519317627, + "num_tokens": 135193863.0, + "step": 58450 + }, + { + "epoch": 0.5359860639955991, + "learning_rate": 9.280462088566976e-05, + "loss": 0.7855, + "mean_token_accuracy": 0.7660774469375611, + "num_tokens": 135218057.0, + "step": 58460 + }, + { + "epoch": 0.5360777482350784, + "learning_rate": 9.278628403777391e-05, + "loss": 0.7669, + "mean_token_accuracy": 0.7679777979850769, + "num_tokens": 135242161.0, + "step": 58470 + }, + { + "epoch": 0.5361694324745576, + "learning_rate": 9.276794718987807e-05, + "loss": 0.7931, + "mean_token_accuracy": 0.7602312386035919, + "num_tokens": 135266361.0, + "step": 58480 + }, + { + "epoch": 0.5362611167140369, + "learning_rate": 9.274961034198221e-05, + "loss": 0.7761, + "mean_token_accuracy": 0.7651449203491211, + "num_tokens": 135290715.0, + "step": 58490 + }, + { + "epoch": 0.5363528009535161, + "learning_rate": 9.273127349408636e-05, + "loss": 0.7851, + "mean_token_accuracy": 0.7679320812225342, + "num_tokens": 135315508.0, + "step": 58500 + }, + { + "epoch": 0.5364444851929954, + "learning_rate": 9.271293664619053e-05, + "loss": 0.7975, + "mean_token_accuracy": 0.7625534296035766, + "num_tokens": 135340418.0, + "step": 58510 + }, + { + "epoch": 0.5365361694324745, + "learning_rate": 9.269459979829468e-05, + "loss": 0.7957, + "mean_token_accuracy": 0.756694632768631, + "num_tokens": 135364927.0, + "step": 58520 + }, + { + "epoch": 0.5366278536719538, + "learning_rate": 9.267626295039883e-05, + "loss": 0.7727, + "mean_token_accuracy": 0.7667570650577545, + "num_tokens": 135389743.0, + "step": 58530 + }, + { + "epoch": 0.536719537911433, + "learning_rate": 9.265792610250298e-05, + "loss": 0.7956, + "mean_token_accuracy": 0.7599010944366456, + "num_tokens": 135413486.0, + "step": 58540 + }, + { + "epoch": 0.5368112221509123, + "learning_rate": 9.263958925460714e-05, + "loss": 0.72, + "mean_token_accuracy": 0.7795994818210602, + "num_tokens": 135439216.0, + "step": 58550 + }, + { + "epoch": 0.5369029063903915, + "learning_rate": 9.262125240671129e-05, + "loss": 0.7862, + "mean_token_accuracy": 0.7627681434154511, + "num_tokens": 135463329.0, + "step": 58560 + }, + { + "epoch": 0.5369945906298708, + "learning_rate": 9.260291555881544e-05, + "loss": 0.818, + "mean_token_accuracy": 0.7461243689060211, + "num_tokens": 135487244.0, + "step": 58570 + }, + { + "epoch": 0.53708627486935, + "learning_rate": 9.25845787109196e-05, + "loss": 0.7813, + "mean_token_accuracy": 0.7591448843479156, + "num_tokens": 135511644.0, + "step": 58580 + }, + { + "epoch": 0.5371779591088292, + "learning_rate": 9.256624186302374e-05, + "loss": 0.7874, + "mean_token_accuracy": 0.7616844713687897, + "num_tokens": 135536113.0, + "step": 58590 + }, + { + "epoch": 0.5372696433483084, + "learning_rate": 9.25479050151279e-05, + "loss": 0.7709, + "mean_token_accuracy": 0.765330970287323, + "num_tokens": 135560046.0, + "step": 58600 + }, + { + "epoch": 0.5373613275877877, + "learning_rate": 9.252956816723206e-05, + "loss": 0.7878, + "mean_token_accuracy": 0.7632694005966186, + "num_tokens": 135584148.0, + "step": 58610 + }, + { + "epoch": 0.5374530118272669, + "learning_rate": 9.251123131933621e-05, + "loss": 0.7176, + "mean_token_accuracy": 0.7732840240001678, + "num_tokens": 135609022.0, + "step": 58620 + }, + { + "epoch": 0.5375446960667462, + "learning_rate": 9.249289447144036e-05, + "loss": 0.7673, + "mean_token_accuracy": 0.7693818151950836, + "num_tokens": 135632757.0, + "step": 58630 + }, + { + "epoch": 0.5376363803062254, + "learning_rate": 9.247455762354452e-05, + "loss": 0.8176, + "mean_token_accuracy": 0.756648164987564, + "num_tokens": 135657576.0, + "step": 58640 + }, + { + "epoch": 0.5377280645457045, + "learning_rate": 9.245622077564867e-05, + "loss": 0.819, + "mean_token_accuracy": 0.7565523028373718, + "num_tokens": 135682154.0, + "step": 58650 + }, + { + "epoch": 0.5378197487851838, + "learning_rate": 9.243788392775282e-05, + "loss": 0.8146, + "mean_token_accuracy": 0.7552489995956421, + "num_tokens": 135706285.0, + "step": 58660 + }, + { + "epoch": 0.537911433024663, + "learning_rate": 9.241954707985697e-05, + "loss": 0.848, + "mean_token_accuracy": 0.7434813380241394, + "num_tokens": 135729514.0, + "step": 58670 + }, + { + "epoch": 0.5380031172641423, + "learning_rate": 9.240121023196114e-05, + "loss": 0.7479, + "mean_token_accuracy": 0.7707680761814117, + "num_tokens": 135753859.0, + "step": 58680 + }, + { + "epoch": 0.5380948015036215, + "learning_rate": 9.238287338406528e-05, + "loss": 0.7827, + "mean_token_accuracy": 0.7675798773765564, + "num_tokens": 135778482.0, + "step": 58690 + }, + { + "epoch": 0.5381864857431008, + "learning_rate": 9.236453653616943e-05, + "loss": 0.7784, + "mean_token_accuracy": 0.7681465446949005, + "num_tokens": 135802610.0, + "step": 58700 + }, + { + "epoch": 0.53827816998258, + "learning_rate": 9.23461996882736e-05, + "loss": 0.8024, + "mean_token_accuracy": 0.7572859346866607, + "num_tokens": 135826238.0, + "step": 58710 + }, + { + "epoch": 0.5383698542220592, + "learning_rate": 9.232786284037775e-05, + "loss": 0.8454, + "mean_token_accuracy": 0.7488239765167236, + "num_tokens": 135849888.0, + "step": 58720 + }, + { + "epoch": 0.5384615384615384, + "learning_rate": 9.23095259924819e-05, + "loss": 0.7609, + "mean_token_accuracy": 0.7731451570987702, + "num_tokens": 135874611.0, + "step": 58730 + }, + { + "epoch": 0.5385532227010177, + "learning_rate": 9.229118914458605e-05, + "loss": 0.762, + "mean_token_accuracy": 0.7702429115772247, + "num_tokens": 135899097.0, + "step": 58740 + }, + { + "epoch": 0.5386449069404969, + "learning_rate": 9.22728522966902e-05, + "loss": 0.8045, + "mean_token_accuracy": 0.7573400974273682, + "num_tokens": 135923927.0, + "step": 58750 + }, + { + "epoch": 0.5387365911799762, + "learning_rate": 9.225451544879435e-05, + "loss": 0.8197, + "mean_token_accuracy": 0.7608265519142151, + "num_tokens": 135948051.0, + "step": 58760 + }, + { + "epoch": 0.5388282754194554, + "learning_rate": 9.223617860089852e-05, + "loss": 0.7554, + "mean_token_accuracy": 0.7739845752716065, + "num_tokens": 135972671.0, + "step": 58770 + }, + { + "epoch": 0.5389199596589346, + "learning_rate": 9.221784175300267e-05, + "loss": 0.7566, + "mean_token_accuracy": 0.7717774510383606, + "num_tokens": 135998399.0, + "step": 58780 + }, + { + "epoch": 0.5390116438984138, + "learning_rate": 9.219950490510681e-05, + "loss": 0.7871, + "mean_token_accuracy": 0.7645931363105773, + "num_tokens": 136022794.0, + "step": 58790 + }, + { + "epoch": 0.5391033281378931, + "learning_rate": 9.218116805721096e-05, + "loss": 0.7565, + "mean_token_accuracy": 0.7741548418998718, + "num_tokens": 136047505.0, + "step": 58800 + }, + { + "epoch": 0.5391950123773723, + "learning_rate": 9.216283120931513e-05, + "loss": 0.7894, + "mean_token_accuracy": 0.7640251398086548, + "num_tokens": 136071039.0, + "step": 58810 + }, + { + "epoch": 0.5392866966168516, + "learning_rate": 9.214449436141928e-05, + "loss": 0.7616, + "mean_token_accuracy": 0.7764576375484467, + "num_tokens": 136095555.0, + "step": 58820 + }, + { + "epoch": 0.5393783808563308, + "learning_rate": 9.212615751352343e-05, + "loss": 0.7591, + "mean_token_accuracy": 0.7665407061576843, + "num_tokens": 136119708.0, + "step": 58830 + }, + { + "epoch": 0.5394700650958101, + "learning_rate": 9.210782066562758e-05, + "loss": 0.803, + "mean_token_accuracy": 0.7570671677589417, + "num_tokens": 136143469.0, + "step": 58840 + }, + { + "epoch": 0.5395617493352892, + "learning_rate": 9.208948381773173e-05, + "loss": 0.8126, + "mean_token_accuracy": 0.7553102552890778, + "num_tokens": 136165962.0, + "step": 58850 + }, + { + "epoch": 0.5396534335747685, + "learning_rate": 9.207114696983588e-05, + "loss": 0.7743, + "mean_token_accuracy": 0.767716646194458, + "num_tokens": 136189494.0, + "step": 58860 + }, + { + "epoch": 0.5397451178142477, + "learning_rate": 9.205281012194005e-05, + "loss": 0.7714, + "mean_token_accuracy": 0.7691974937915802, + "num_tokens": 136213295.0, + "step": 58870 + }, + { + "epoch": 0.539836802053727, + "learning_rate": 9.20344732740442e-05, + "loss": 0.7817, + "mean_token_accuracy": 0.7664900839328765, + "num_tokens": 136235677.0, + "step": 58880 + }, + { + "epoch": 0.5399284862932062, + "learning_rate": 9.201613642614834e-05, + "loss": 0.78, + "mean_token_accuracy": 0.7662824213504791, + "num_tokens": 136259347.0, + "step": 58890 + }, + { + "epoch": 0.5400201705326855, + "learning_rate": 9.19977995782525e-05, + "loss": 0.8049, + "mean_token_accuracy": 0.7642119467258454, + "num_tokens": 136284294.0, + "step": 58900 + }, + { + "epoch": 0.5401118547721646, + "learning_rate": 9.197946273035666e-05, + "loss": 0.7783, + "mean_token_accuracy": 0.7709306061267853, + "num_tokens": 136308767.0, + "step": 58910 + }, + { + "epoch": 0.5402035390116439, + "learning_rate": 9.196112588246081e-05, + "loss": 0.7474, + "mean_token_accuracy": 0.7727955460548401, + "num_tokens": 136332794.0, + "step": 58920 + }, + { + "epoch": 0.5402952232511231, + "learning_rate": 9.194278903456496e-05, + "loss": 0.7869, + "mean_token_accuracy": 0.7615944862365722, + "num_tokens": 136356879.0, + "step": 58930 + }, + { + "epoch": 0.5403869074906024, + "learning_rate": 9.192445218666911e-05, + "loss": 0.7769, + "mean_token_accuracy": 0.7636140763759613, + "num_tokens": 136380377.0, + "step": 58940 + }, + { + "epoch": 0.5404785917300816, + "learning_rate": 9.190611533877327e-05, + "loss": 0.804, + "mean_token_accuracy": 0.7576845228672028, + "num_tokens": 136404768.0, + "step": 58950 + }, + { + "epoch": 0.5405702759695609, + "learning_rate": 9.188777849087742e-05, + "loss": 0.8015, + "mean_token_accuracy": 0.7631287217140198, + "num_tokens": 136429418.0, + "step": 58960 + }, + { + "epoch": 0.5406619602090401, + "learning_rate": 9.186944164298158e-05, + "loss": 0.7953, + "mean_token_accuracy": 0.760073584318161, + "num_tokens": 136453803.0, + "step": 58970 + }, + { + "epoch": 0.5407536444485193, + "learning_rate": 9.185110479508573e-05, + "loss": 0.7551, + "mean_token_accuracy": 0.7727975487709046, + "num_tokens": 136479297.0, + "step": 58980 + }, + { + "epoch": 0.5408453286879985, + "learning_rate": 9.183276794718987e-05, + "loss": 0.7564, + "mean_token_accuracy": 0.7678837537765503, + "num_tokens": 136503667.0, + "step": 58990 + }, + { + "epoch": 0.5409370129274778, + "learning_rate": 9.181443109929404e-05, + "loss": 0.7837, + "mean_token_accuracy": 0.7612081289291381, + "num_tokens": 136527150.0, + "step": 59000 + }, + { + "epoch": 0.541028697166957, + "learning_rate": 9.179609425139819e-05, + "loss": 0.8105, + "mean_token_accuracy": 0.7585221111774445, + "num_tokens": 136550805.0, + "step": 59010 + }, + { + "epoch": 0.5411203814064363, + "learning_rate": 9.177775740350234e-05, + "loss": 0.7932, + "mean_token_accuracy": 0.7661087095737458, + "num_tokens": 136575553.0, + "step": 59020 + }, + { + "epoch": 0.5412120656459155, + "learning_rate": 9.175942055560651e-05, + "loss": 0.7622, + "mean_token_accuracy": 0.763846355676651, + "num_tokens": 136600504.0, + "step": 59030 + }, + { + "epoch": 0.5413037498853946, + "learning_rate": 9.174108370771065e-05, + "loss": 0.789, + "mean_token_accuracy": 0.7613443434238434, + "num_tokens": 136624694.0, + "step": 59040 + }, + { + "epoch": 0.5413954341248739, + "learning_rate": 9.17227468598148e-05, + "loss": 0.7518, + "mean_token_accuracy": 0.7728749930858612, + "num_tokens": 136648358.0, + "step": 59050 + }, + { + "epoch": 0.5414871183643531, + "learning_rate": 9.170441001191895e-05, + "loss": 0.8121, + "mean_token_accuracy": 0.7570838332176208, + "num_tokens": 136672057.0, + "step": 59060 + }, + { + "epoch": 0.5415788026038324, + "learning_rate": 9.168607316402311e-05, + "loss": 0.7983, + "mean_token_accuracy": 0.7637819230556488, + "num_tokens": 136695211.0, + "step": 59070 + }, + { + "epoch": 0.5416704868433116, + "learning_rate": 9.166773631612727e-05, + "loss": 0.7879, + "mean_token_accuracy": 0.7602478384971618, + "num_tokens": 136718855.0, + "step": 59080 + }, + { + "epoch": 0.5417621710827909, + "learning_rate": 9.16493994682314e-05, + "loss": 0.761, + "mean_token_accuracy": 0.7691253364086151, + "num_tokens": 136743036.0, + "step": 59090 + }, + { + "epoch": 0.5418538553222702, + "learning_rate": 9.163106262033557e-05, + "loss": 0.7597, + "mean_token_accuracy": 0.7667005777359008, + "num_tokens": 136767331.0, + "step": 59100 + }, + { + "epoch": 0.5419455395617493, + "learning_rate": 9.161272577243972e-05, + "loss": 0.8674, + "mean_token_accuracy": 0.7464340209960938, + "num_tokens": 136790075.0, + "step": 59110 + }, + { + "epoch": 0.5420372238012285, + "learning_rate": 9.159438892454387e-05, + "loss": 0.832, + "mean_token_accuracy": 0.747848105430603, + "num_tokens": 136815522.0, + "step": 59120 + }, + { + "epoch": 0.5421289080407078, + "learning_rate": 9.157605207664804e-05, + "loss": 0.7869, + "mean_token_accuracy": 0.763346540927887, + "num_tokens": 136839737.0, + "step": 59130 + }, + { + "epoch": 0.542220592280187, + "learning_rate": 9.155771522875218e-05, + "loss": 0.7772, + "mean_token_accuracy": 0.7635484337806702, + "num_tokens": 136863491.0, + "step": 59140 + }, + { + "epoch": 0.5423122765196663, + "learning_rate": 9.153937838085633e-05, + "loss": 0.7502, + "mean_token_accuracy": 0.7703371524810791, + "num_tokens": 136887844.0, + "step": 59150 + }, + { + "epoch": 0.5424039607591455, + "learning_rate": 9.152104153296048e-05, + "loss": 0.7536, + "mean_token_accuracy": 0.770036643743515, + "num_tokens": 136912731.0, + "step": 59160 + }, + { + "epoch": 0.5424956449986247, + "learning_rate": 9.150270468506465e-05, + "loss": 0.7553, + "mean_token_accuracy": 0.769990760087967, + "num_tokens": 136936070.0, + "step": 59170 + }, + { + "epoch": 0.5425873292381039, + "learning_rate": 9.14843678371688e-05, + "loss": 0.7442, + "mean_token_accuracy": 0.773495864868164, + "num_tokens": 136959936.0, + "step": 59180 + }, + { + "epoch": 0.5426790134775832, + "learning_rate": 9.146603098927294e-05, + "loss": 0.7833, + "mean_token_accuracy": 0.7637665331363678, + "num_tokens": 136983865.0, + "step": 59190 + }, + { + "epoch": 0.5427706977170624, + "learning_rate": 9.14476941413771e-05, + "loss": 0.7712, + "mean_token_accuracy": 0.7694948494434357, + "num_tokens": 137007165.0, + "step": 59200 + }, + { + "epoch": 0.5428623819565417, + "learning_rate": 9.142935729348125e-05, + "loss": 0.793, + "mean_token_accuracy": 0.7622173428535461, + "num_tokens": 137031800.0, + "step": 59210 + }, + { + "epoch": 0.5429540661960209, + "learning_rate": 9.14110204455854e-05, + "loss": 0.7354, + "mean_token_accuracy": 0.7782780170440674, + "num_tokens": 137056100.0, + "step": 59220 + }, + { + "epoch": 0.5430457504355002, + "learning_rate": 9.139268359768957e-05, + "loss": 0.7661, + "mean_token_accuracy": 0.7641168296337127, + "num_tokens": 137080410.0, + "step": 59230 + }, + { + "epoch": 0.5431374346749793, + "learning_rate": 9.137434674979371e-05, + "loss": 0.7607, + "mean_token_accuracy": 0.7686898529529571, + "num_tokens": 137104366.0, + "step": 59240 + }, + { + "epoch": 0.5432291189144586, + "learning_rate": 9.135600990189786e-05, + "loss": 0.7683, + "mean_token_accuracy": 0.7621020674705505, + "num_tokens": 137129134.0, + "step": 59250 + }, + { + "epoch": 0.5433208031539378, + "learning_rate": 9.133767305400203e-05, + "loss": 0.7677, + "mean_token_accuracy": 0.7702788650989533, + "num_tokens": 137154523.0, + "step": 59260 + }, + { + "epoch": 0.5434124873934171, + "learning_rate": 9.131933620610618e-05, + "loss": 0.7955, + "mean_token_accuracy": 0.7685214102268219, + "num_tokens": 137179556.0, + "step": 59270 + }, + { + "epoch": 0.5435041716328963, + "learning_rate": 9.130099935821033e-05, + "loss": 0.7984, + "mean_token_accuracy": 0.7586545467376709, + "num_tokens": 137203707.0, + "step": 59280 + }, + { + "epoch": 0.5435958558723756, + "learning_rate": 9.128266251031447e-05, + "loss": 0.7535, + "mean_token_accuracy": 0.7715396046638489, + "num_tokens": 137227419.0, + "step": 59290 + }, + { + "epoch": 0.5436875401118547, + "learning_rate": 9.126432566241863e-05, + "loss": 0.7477, + "mean_token_accuracy": 0.7667481362819671, + "num_tokens": 137251769.0, + "step": 59300 + }, + { + "epoch": 0.543779224351334, + "learning_rate": 9.124598881452279e-05, + "loss": 0.7586, + "mean_token_accuracy": 0.7621158480644226, + "num_tokens": 137276167.0, + "step": 59310 + }, + { + "epoch": 0.5438709085908132, + "learning_rate": 9.122765196662694e-05, + "loss": 0.7935, + "mean_token_accuracy": 0.761205005645752, + "num_tokens": 137300360.0, + "step": 59320 + }, + { + "epoch": 0.5439625928302925, + "learning_rate": 9.12093151187311e-05, + "loss": 0.7793, + "mean_token_accuracy": 0.7672877252101898, + "num_tokens": 137325123.0, + "step": 59330 + }, + { + "epoch": 0.5440542770697717, + "learning_rate": 9.119097827083524e-05, + "loss": 0.7474, + "mean_token_accuracy": 0.773924195766449, + "num_tokens": 137349627.0, + "step": 59340 + }, + { + "epoch": 0.544145961309251, + "learning_rate": 9.11726414229394e-05, + "loss": 0.7736, + "mean_token_accuracy": 0.7691892743110657, + "num_tokens": 137374587.0, + "step": 59350 + }, + { + "epoch": 0.5442376455487302, + "learning_rate": 9.115430457504356e-05, + "loss": 0.7446, + "mean_token_accuracy": 0.7727368533611297, + "num_tokens": 137398954.0, + "step": 59360 + }, + { + "epoch": 0.5443293297882094, + "learning_rate": 9.113596772714771e-05, + "loss": 0.7869, + "mean_token_accuracy": 0.7626693844795227, + "num_tokens": 137422734.0, + "step": 59370 + }, + { + "epoch": 0.5444210140276886, + "learning_rate": 9.111763087925186e-05, + "loss": 0.781, + "mean_token_accuracy": 0.7663978457450866, + "num_tokens": 137446891.0, + "step": 59380 + }, + { + "epoch": 0.5445126982671679, + "learning_rate": 9.109929403135602e-05, + "loss": 0.7744, + "mean_token_accuracy": 0.7736323773860931, + "num_tokens": 137471015.0, + "step": 59390 + }, + { + "epoch": 0.5446043825066471, + "learning_rate": 9.108095718346017e-05, + "loss": 0.7985, + "mean_token_accuracy": 0.7581858396530151, + "num_tokens": 137495436.0, + "step": 59400 + }, + { + "epoch": 0.5446960667461264, + "learning_rate": 9.106262033556432e-05, + "loss": 0.8202, + "mean_token_accuracy": 0.7503768920898437, + "num_tokens": 137519383.0, + "step": 59410 + }, + { + "epoch": 0.5447877509856056, + "learning_rate": 9.104428348766847e-05, + "loss": 0.7861, + "mean_token_accuracy": 0.768260782957077, + "num_tokens": 137544364.0, + "step": 59420 + }, + { + "epoch": 0.5448794352250849, + "learning_rate": 9.102594663977264e-05, + "loss": 0.7689, + "mean_token_accuracy": 0.7657553672790527, + "num_tokens": 137568472.0, + "step": 59430 + }, + { + "epoch": 0.544971119464564, + "learning_rate": 9.100760979187677e-05, + "loss": 0.8023, + "mean_token_accuracy": 0.7602219462394715, + "num_tokens": 137592014.0, + "step": 59440 + }, + { + "epoch": 0.5450628037040433, + "learning_rate": 9.098927294398093e-05, + "loss": 0.7362, + "mean_token_accuracy": 0.7781449675559997, + "num_tokens": 137616381.0, + "step": 59450 + }, + { + "epoch": 0.5451544879435225, + "learning_rate": 9.097093609608509e-05, + "loss": 0.7501, + "mean_token_accuracy": 0.7706298887729645, + "num_tokens": 137641531.0, + "step": 59460 + }, + { + "epoch": 0.5452461721830018, + "learning_rate": 9.095259924818924e-05, + "loss": 0.766, + "mean_token_accuracy": 0.7670444369316101, + "num_tokens": 137665465.0, + "step": 59470 + }, + { + "epoch": 0.545337856422481, + "learning_rate": 9.09342624002934e-05, + "loss": 0.7875, + "mean_token_accuracy": 0.7642770171165466, + "num_tokens": 137689269.0, + "step": 59480 + }, + { + "epoch": 0.5454295406619603, + "learning_rate": 9.091592555239755e-05, + "loss": 0.7614, + "mean_token_accuracy": 0.7682712256908417, + "num_tokens": 137713898.0, + "step": 59490 + }, + { + "epoch": 0.5455212249014394, + "learning_rate": 9.08975887045017e-05, + "loss": 0.7915, + "mean_token_accuracy": 0.7614459991455078, + "num_tokens": 137738114.0, + "step": 59500 + }, + { + "epoch": 0.5456129091409186, + "learning_rate": 9.087925185660585e-05, + "loss": 0.7396, + "mean_token_accuracy": 0.776121324300766, + "num_tokens": 137762528.0, + "step": 59510 + }, + { + "epoch": 0.5457045933803979, + "learning_rate": 9.086091500871002e-05, + "loss": 0.7384, + "mean_token_accuracy": 0.7770536065101623, + "num_tokens": 137786929.0, + "step": 59520 + }, + { + "epoch": 0.5457962776198771, + "learning_rate": 9.084257816081417e-05, + "loss": 0.8456, + "mean_token_accuracy": 0.7492571771144867, + "num_tokens": 137811416.0, + "step": 59530 + }, + { + "epoch": 0.5458879618593564, + "learning_rate": 9.08242413129183e-05, + "loss": 0.7841, + "mean_token_accuracy": 0.7638105869293212, + "num_tokens": 137835907.0, + "step": 59540 + }, + { + "epoch": 0.5459796460988356, + "learning_rate": 9.080590446502246e-05, + "loss": 0.7762, + "mean_token_accuracy": 0.7648620069026947, + "num_tokens": 137858858.0, + "step": 59550 + }, + { + "epoch": 0.5460713303383149, + "learning_rate": 9.078756761712662e-05, + "loss": 0.7516, + "mean_token_accuracy": 0.767018860578537, + "num_tokens": 137883066.0, + "step": 59560 + }, + { + "epoch": 0.546163014577794, + "learning_rate": 9.076923076923078e-05, + "loss": 0.7508, + "mean_token_accuracy": 0.772193866968155, + "num_tokens": 137907861.0, + "step": 59570 + }, + { + "epoch": 0.5462546988172733, + "learning_rate": 9.075089392133493e-05, + "loss": 0.7818, + "mean_token_accuracy": 0.7609135806560516, + "num_tokens": 137931671.0, + "step": 59580 + }, + { + "epoch": 0.5463463830567525, + "learning_rate": 9.073255707343908e-05, + "loss": 0.7457, + "mean_token_accuracy": 0.7700284779071808, + "num_tokens": 137955637.0, + "step": 59590 + }, + { + "epoch": 0.5464380672962318, + "learning_rate": 9.071422022554323e-05, + "loss": 0.7723, + "mean_token_accuracy": 0.7626480221748352, + "num_tokens": 137981083.0, + "step": 59600 + }, + { + "epoch": 0.546529751535711, + "learning_rate": 9.069588337764738e-05, + "loss": 0.7634, + "mean_token_accuracy": 0.7701726138591767, + "num_tokens": 138005180.0, + "step": 59610 + }, + { + "epoch": 0.5466214357751903, + "learning_rate": 9.067754652975155e-05, + "loss": 0.7834, + "mean_token_accuracy": 0.7668368339538574, + "num_tokens": 138028986.0, + "step": 59620 + }, + { + "epoch": 0.5467131200146694, + "learning_rate": 9.06592096818557e-05, + "loss": 0.7772, + "mean_token_accuracy": 0.7639792084693908, + "num_tokens": 138052877.0, + "step": 59630 + }, + { + "epoch": 0.5468048042541487, + "learning_rate": 9.064087283395984e-05, + "loss": 0.7363, + "mean_token_accuracy": 0.7714833319187164, + "num_tokens": 138077288.0, + "step": 59640 + }, + { + "epoch": 0.5468964884936279, + "learning_rate": 9.062253598606399e-05, + "loss": 0.8167, + "mean_token_accuracy": 0.7511677742004395, + "num_tokens": 138101702.0, + "step": 59650 + }, + { + "epoch": 0.5469881727331072, + "learning_rate": 9.060419913816816e-05, + "loss": 0.748, + "mean_token_accuracy": 0.7644962072372437, + "num_tokens": 138125949.0, + "step": 59660 + }, + { + "epoch": 0.5470798569725864, + "learning_rate": 9.058586229027231e-05, + "loss": 0.7367, + "mean_token_accuracy": 0.7778648614883423, + "num_tokens": 138150429.0, + "step": 59670 + }, + { + "epoch": 0.5471715412120657, + "learning_rate": 9.056752544237646e-05, + "loss": 0.7257, + "mean_token_accuracy": 0.7757183253765106, + "num_tokens": 138174301.0, + "step": 59680 + }, + { + "epoch": 0.5472632254515449, + "learning_rate": 9.054918859448061e-05, + "loss": 0.7876, + "mean_token_accuracy": 0.7617397546768189, + "num_tokens": 138198872.0, + "step": 59690 + }, + { + "epoch": 0.5473549096910241, + "learning_rate": 9.053085174658476e-05, + "loss": 0.7193, + "mean_token_accuracy": 0.7781609416007995, + "num_tokens": 138223673.0, + "step": 59700 + }, + { + "epoch": 0.5474465939305033, + "learning_rate": 9.051251489868892e-05, + "loss": 0.7674, + "mean_token_accuracy": 0.7675589799880982, + "num_tokens": 138247443.0, + "step": 59710 + }, + { + "epoch": 0.5475382781699826, + "learning_rate": 9.049417805079308e-05, + "loss": 0.7716, + "mean_token_accuracy": 0.7680305480957031, + "num_tokens": 138271451.0, + "step": 59720 + }, + { + "epoch": 0.5476299624094618, + "learning_rate": 9.047584120289723e-05, + "loss": 0.7624, + "mean_token_accuracy": 0.7677345633506775, + "num_tokens": 138296088.0, + "step": 59730 + }, + { + "epoch": 0.5477216466489411, + "learning_rate": 9.045750435500137e-05, + "loss": 0.7328, + "mean_token_accuracy": 0.7792566597461701, + "num_tokens": 138320598.0, + "step": 59740 + }, + { + "epoch": 0.5478133308884203, + "learning_rate": 9.043916750710554e-05, + "loss": 0.7246, + "mean_token_accuracy": 0.7782040536403656, + "num_tokens": 138345654.0, + "step": 59750 + }, + { + "epoch": 0.5479050151278995, + "learning_rate": 9.042083065920969e-05, + "loss": 0.7558, + "mean_token_accuracy": 0.7744125485420227, + "num_tokens": 138369920.0, + "step": 59760 + }, + { + "epoch": 0.5479966993673787, + "learning_rate": 9.040249381131384e-05, + "loss": 0.7676, + "mean_token_accuracy": 0.764605587720871, + "num_tokens": 138395104.0, + "step": 59770 + }, + { + "epoch": 0.548088383606858, + "learning_rate": 9.038415696341799e-05, + "loss": 0.7749, + "mean_token_accuracy": 0.7652956008911133, + "num_tokens": 138419545.0, + "step": 59780 + }, + { + "epoch": 0.5481800678463372, + "learning_rate": 9.036582011552214e-05, + "loss": 0.7712, + "mean_token_accuracy": 0.7687505304813385, + "num_tokens": 138443242.0, + "step": 59790 + }, + { + "epoch": 0.5482717520858165, + "learning_rate": 9.03474832676263e-05, + "loss": 0.7546, + "mean_token_accuracy": 0.7709036409854889, + "num_tokens": 138467198.0, + "step": 59800 + }, + { + "epoch": 0.5483634363252957, + "learning_rate": 9.032914641973045e-05, + "loss": 0.7685, + "mean_token_accuracy": 0.7652524054050446, + "num_tokens": 138491073.0, + "step": 59810 + }, + { + "epoch": 0.548455120564775, + "learning_rate": 9.031080957183461e-05, + "loss": 0.7621, + "mean_token_accuracy": 0.7733059167861939, + "num_tokens": 138516540.0, + "step": 59820 + }, + { + "epoch": 0.5485468048042541, + "learning_rate": 9.029247272393877e-05, + "loss": 0.7985, + "mean_token_accuracy": 0.7557156145572662, + "num_tokens": 138539771.0, + "step": 59830 + }, + { + "epoch": 0.5486384890437334, + "learning_rate": 9.02741358760429e-05, + "loss": 0.7918, + "mean_token_accuracy": 0.7638346672058105, + "num_tokens": 138564028.0, + "step": 59840 + }, + { + "epoch": 0.5487301732832126, + "learning_rate": 9.025579902814707e-05, + "loss": 0.7895, + "mean_token_accuracy": 0.7664784848690033, + "num_tokens": 138587648.0, + "step": 59850 + }, + { + "epoch": 0.5488218575226919, + "learning_rate": 9.023746218025122e-05, + "loss": 0.797, + "mean_token_accuracy": 0.764485776424408, + "num_tokens": 138611625.0, + "step": 59860 + }, + { + "epoch": 0.5489135417621711, + "learning_rate": 9.021912533235537e-05, + "loss": 0.7629, + "mean_token_accuracy": 0.7619397938251495, + "num_tokens": 138636265.0, + "step": 59870 + }, + { + "epoch": 0.5490052260016504, + "learning_rate": 9.020078848445952e-05, + "loss": 0.753, + "mean_token_accuracy": 0.7711450815200805, + "num_tokens": 138660743.0, + "step": 59880 + }, + { + "epoch": 0.5490969102411295, + "learning_rate": 9.018245163656368e-05, + "loss": 0.7708, + "mean_token_accuracy": 0.7716257810592652, + "num_tokens": 138685011.0, + "step": 59890 + }, + { + "epoch": 0.5491885944806087, + "learning_rate": 9.016411478866783e-05, + "loss": 0.7559, + "mean_token_accuracy": 0.7772553920745849, + "num_tokens": 138709378.0, + "step": 59900 + }, + { + "epoch": 0.549280278720088, + "learning_rate": 9.014577794077198e-05, + "loss": 0.7817, + "mean_token_accuracy": 0.7682043612003326, + "num_tokens": 138733271.0, + "step": 59910 + }, + { + "epoch": 0.5493719629595673, + "learning_rate": 9.012744109287615e-05, + "loss": 0.7461, + "mean_token_accuracy": 0.7688748776912689, + "num_tokens": 138757825.0, + "step": 59920 + }, + { + "epoch": 0.5494636471990465, + "learning_rate": 9.01091042449803e-05, + "loss": 0.7717, + "mean_token_accuracy": 0.7701102018356323, + "num_tokens": 138782084.0, + "step": 59930 + }, + { + "epoch": 0.5495553314385258, + "learning_rate": 9.009076739708444e-05, + "loss": 0.7337, + "mean_token_accuracy": 0.7770924091339111, + "num_tokens": 138806224.0, + "step": 59940 + }, + { + "epoch": 0.549647015678005, + "learning_rate": 9.00724305491886e-05, + "loss": 0.7905, + "mean_token_accuracy": 0.7614732563495636, + "num_tokens": 138830323.0, + "step": 59950 + }, + { + "epoch": 0.5497386999174841, + "learning_rate": 9.005409370129275e-05, + "loss": 0.7217, + "mean_token_accuracy": 0.7798113286495209, + "num_tokens": 138854012.0, + "step": 59960 + }, + { + "epoch": 0.5498303841569634, + "learning_rate": 9.00357568533969e-05, + "loss": 0.757, + "mean_token_accuracy": 0.7711302220821381, + "num_tokens": 138878505.0, + "step": 59970 + }, + { + "epoch": 0.5499220683964426, + "learning_rate": 9.001742000550106e-05, + "loss": 0.7008, + "mean_token_accuracy": 0.7812945306301117, + "num_tokens": 138903120.0, + "step": 59980 + }, + { + "epoch": 0.5500137526359219, + "learning_rate": 8.999908315760521e-05, + "loss": 0.7091, + "mean_token_accuracy": 0.7743261158466339, + "num_tokens": 138927734.0, + "step": 59990 + }, + { + "epoch": 0.5501054368754011, + "learning_rate": 8.998074630970936e-05, + "loss": 0.7105, + "mean_token_accuracy": 0.7869706869125366, + "num_tokens": 138953168.0, + "step": 60000 + }, + { + "epoch": 0.5501971211148804, + "learning_rate": 8.996240946181353e-05, + "loss": 0.8146, + "mean_token_accuracy": 0.7537143945693969, + "num_tokens": 138977485.0, + "step": 60010 + }, + { + "epoch": 0.5502888053543595, + "learning_rate": 8.994407261391768e-05, + "loss": 0.7735, + "mean_token_accuracy": 0.7683954477310181, + "num_tokens": 139001454.0, + "step": 60020 + }, + { + "epoch": 0.5503804895938388, + "learning_rate": 8.992573576602183e-05, + "loss": 0.781, + "mean_token_accuracy": 0.7664335370063782, + "num_tokens": 139025848.0, + "step": 60030 + }, + { + "epoch": 0.550472173833318, + "learning_rate": 8.990739891812597e-05, + "loss": 0.7821, + "mean_token_accuracy": 0.764576894044876, + "num_tokens": 139050485.0, + "step": 60040 + }, + { + "epoch": 0.5505638580727973, + "learning_rate": 8.988906207023013e-05, + "loss": 0.7389, + "mean_token_accuracy": 0.7736314237117767, + "num_tokens": 139074877.0, + "step": 60050 + }, + { + "epoch": 0.5506555423122765, + "learning_rate": 8.987072522233429e-05, + "loss": 0.7397, + "mean_token_accuracy": 0.7742312371730804, + "num_tokens": 139098559.0, + "step": 60060 + }, + { + "epoch": 0.5507472265517558, + "learning_rate": 8.985238837443844e-05, + "loss": 0.7574, + "mean_token_accuracy": 0.76783966422081, + "num_tokens": 139123948.0, + "step": 60070 + }, + { + "epoch": 0.550838910791235, + "learning_rate": 8.983405152654259e-05, + "loss": 0.7296, + "mean_token_accuracy": 0.7761675238609314, + "num_tokens": 139148419.0, + "step": 60080 + }, + { + "epoch": 0.5509305950307142, + "learning_rate": 8.981571467864674e-05, + "loss": 0.7365, + "mean_token_accuracy": 0.7745570719242096, + "num_tokens": 139173088.0, + "step": 60090 + }, + { + "epoch": 0.5510222792701934, + "learning_rate": 8.979737783075089e-05, + "loss": 0.7389, + "mean_token_accuracy": 0.779655647277832, + "num_tokens": 139198318.0, + "step": 60100 + }, + { + "epoch": 0.5511139635096727, + "learning_rate": 8.977904098285506e-05, + "loss": 0.6958, + "mean_token_accuracy": 0.7848239302635193, + "num_tokens": 139222660.0, + "step": 60110 + }, + { + "epoch": 0.5512056477491519, + "learning_rate": 8.976070413495921e-05, + "loss": 0.7385, + "mean_token_accuracy": 0.7779003560543061, + "num_tokens": 139247176.0, + "step": 60120 + }, + { + "epoch": 0.5512973319886312, + "learning_rate": 8.974236728706336e-05, + "loss": 0.7765, + "mean_token_accuracy": 0.7620017051696777, + "num_tokens": 139271464.0, + "step": 60130 + }, + { + "epoch": 0.5513890162281104, + "learning_rate": 8.972403043916751e-05, + "loss": 0.7618, + "mean_token_accuracy": 0.7723858892917633, + "num_tokens": 139294980.0, + "step": 60140 + }, + { + "epoch": 0.5514807004675896, + "learning_rate": 8.970569359127167e-05, + "loss": 0.7605, + "mean_token_accuracy": 0.7708096027374267, + "num_tokens": 139319266.0, + "step": 60150 + }, + { + "epoch": 0.5515723847070688, + "learning_rate": 8.968735674337582e-05, + "loss": 0.7718, + "mean_token_accuracy": 0.7658926963806152, + "num_tokens": 139343814.0, + "step": 60160 + }, + { + "epoch": 0.5516640689465481, + "learning_rate": 8.966901989547997e-05, + "loss": 0.7608, + "mean_token_accuracy": 0.7604470908641815, + "num_tokens": 139367529.0, + "step": 60170 + }, + { + "epoch": 0.5517557531860273, + "learning_rate": 8.965068304758412e-05, + "loss": 0.7396, + "mean_token_accuracy": 0.7774915635585785, + "num_tokens": 139391982.0, + "step": 60180 + }, + { + "epoch": 0.5518474374255066, + "learning_rate": 8.963234619968827e-05, + "loss": 0.7581, + "mean_token_accuracy": 0.7741159200668335, + "num_tokens": 139416174.0, + "step": 60190 + }, + { + "epoch": 0.5519391216649858, + "learning_rate": 8.961400935179242e-05, + "loss": 0.7495, + "mean_token_accuracy": 0.7707136988639831, + "num_tokens": 139441176.0, + "step": 60200 + }, + { + "epoch": 0.5520308059044651, + "learning_rate": 8.959567250389659e-05, + "loss": 0.7823, + "mean_token_accuracy": 0.7647032737731934, + "num_tokens": 139465616.0, + "step": 60210 + }, + { + "epoch": 0.5521224901439442, + "learning_rate": 8.957733565600074e-05, + "loss": 0.7424, + "mean_token_accuracy": 0.7688823223114014, + "num_tokens": 139489643.0, + "step": 60220 + }, + { + "epoch": 0.5522141743834235, + "learning_rate": 8.95589988081049e-05, + "loss": 0.7255, + "mean_token_accuracy": 0.7780394971370697, + "num_tokens": 139513584.0, + "step": 60230 + }, + { + "epoch": 0.5523058586229027, + "learning_rate": 8.954066196020905e-05, + "loss": 0.7664, + "mean_token_accuracy": 0.7680767595767974, + "num_tokens": 139537927.0, + "step": 60240 + }, + { + "epoch": 0.552397542862382, + "learning_rate": 8.95223251123132e-05, + "loss": 0.7172, + "mean_token_accuracy": 0.7776258885860443, + "num_tokens": 139562292.0, + "step": 60250 + }, + { + "epoch": 0.5524892271018612, + "learning_rate": 8.950398826441735e-05, + "loss": 0.7758, + "mean_token_accuracy": 0.7627845525741577, + "num_tokens": 139586080.0, + "step": 60260 + }, + { + "epoch": 0.5525809113413405, + "learning_rate": 8.94856514165215e-05, + "loss": 0.8077, + "mean_token_accuracy": 0.7642762005329132, + "num_tokens": 139609576.0, + "step": 60270 + }, + { + "epoch": 0.5526725955808196, + "learning_rate": 8.946731456862565e-05, + "loss": 0.747, + "mean_token_accuracy": 0.7752709448337555, + "num_tokens": 139634017.0, + "step": 60280 + }, + { + "epoch": 0.5527642798202989, + "learning_rate": 8.94489777207298e-05, + "loss": 0.7868, + "mean_token_accuracy": 0.7587838709354401, + "num_tokens": 139658406.0, + "step": 60290 + }, + { + "epoch": 0.5528559640597781, + "learning_rate": 8.943064087283396e-05, + "loss": 0.7345, + "mean_token_accuracy": 0.7784680187702179, + "num_tokens": 139683175.0, + "step": 60300 + }, + { + "epoch": 0.5529476482992574, + "learning_rate": 8.941230402493812e-05, + "loss": 0.788, + "mean_token_accuracy": 0.7650320649147033, + "num_tokens": 139708314.0, + "step": 60310 + }, + { + "epoch": 0.5530393325387366, + "learning_rate": 8.939396717704227e-05, + "loss": 0.7389, + "mean_token_accuracy": 0.7763622403144836, + "num_tokens": 139733482.0, + "step": 60320 + }, + { + "epoch": 0.5531310167782159, + "learning_rate": 8.937563032914643e-05, + "loss": 0.7976, + "mean_token_accuracy": 0.7633031368255615, + "num_tokens": 139757652.0, + "step": 60330 + }, + { + "epoch": 0.5532227010176951, + "learning_rate": 8.935729348125058e-05, + "loss": 0.7675, + "mean_token_accuracy": 0.766411405801773, + "num_tokens": 139782342.0, + "step": 60340 + }, + { + "epoch": 0.5533143852571742, + "learning_rate": 8.933895663335473e-05, + "loss": 0.7221, + "mean_token_accuracy": 0.7828215837478638, + "num_tokens": 139806368.0, + "step": 60350 + }, + { + "epoch": 0.5534060694966535, + "learning_rate": 8.932061978545888e-05, + "loss": 0.7424, + "mean_token_accuracy": 0.7767630159854889, + "num_tokens": 139830790.0, + "step": 60360 + }, + { + "epoch": 0.5534977537361327, + "learning_rate": 8.930228293756305e-05, + "loss": 0.7327, + "mean_token_accuracy": 0.7781683087348938, + "num_tokens": 139854776.0, + "step": 60370 + }, + { + "epoch": 0.553589437975612, + "learning_rate": 8.928394608966719e-05, + "loss": 0.7548, + "mean_token_accuracy": 0.7682272791862488, + "num_tokens": 139878902.0, + "step": 60380 + }, + { + "epoch": 0.5536811222150912, + "learning_rate": 8.926560924177134e-05, + "loss": 0.7637, + "mean_token_accuracy": 0.7684300899505615, + "num_tokens": 139904005.0, + "step": 60390 + }, + { + "epoch": 0.5537728064545705, + "learning_rate": 8.924727239387549e-05, + "loss": 0.6881, + "mean_token_accuracy": 0.7928227484226227, + "num_tokens": 139928142.0, + "step": 60400 + }, + { + "epoch": 0.5538644906940496, + "learning_rate": 8.922893554597965e-05, + "loss": 0.7226, + "mean_token_accuracy": 0.7775552093982696, + "num_tokens": 139952589.0, + "step": 60410 + }, + { + "epoch": 0.5539561749335289, + "learning_rate": 8.92105986980838e-05, + "loss": 0.7156, + "mean_token_accuracy": 0.7812934756278992, + "num_tokens": 139977972.0, + "step": 60420 + }, + { + "epoch": 0.5540478591730081, + "learning_rate": 8.919226185018796e-05, + "loss": 0.7428, + "mean_token_accuracy": 0.7776130139827728, + "num_tokens": 140003070.0, + "step": 60430 + }, + { + "epoch": 0.5541395434124874, + "learning_rate": 8.917392500229211e-05, + "loss": 0.7745, + "mean_token_accuracy": 0.7657585442066193, + "num_tokens": 140027538.0, + "step": 60440 + }, + { + "epoch": 0.5542312276519666, + "learning_rate": 8.915558815439626e-05, + "loss": 0.769, + "mean_token_accuracy": 0.773032295703888, + "num_tokens": 140052026.0, + "step": 60450 + }, + { + "epoch": 0.5543229118914459, + "learning_rate": 8.913725130650041e-05, + "loss": 0.7769, + "mean_token_accuracy": 0.7604465782642365, + "num_tokens": 140076037.0, + "step": 60460 + }, + { + "epoch": 0.5544145961309251, + "learning_rate": 8.911891445860458e-05, + "loss": 0.7558, + "mean_token_accuracy": 0.7691322803497315, + "num_tokens": 140100191.0, + "step": 60470 + }, + { + "epoch": 0.5545062803704043, + "learning_rate": 8.910057761070872e-05, + "loss": 0.6975, + "mean_token_accuracy": 0.7837631106376648, + "num_tokens": 140125905.0, + "step": 60480 + }, + { + "epoch": 0.5545979646098835, + "learning_rate": 8.908224076281287e-05, + "loss": 0.7599, + "mean_token_accuracy": 0.7748779773712158, + "num_tokens": 140150936.0, + "step": 60490 + }, + { + "epoch": 0.5546896488493628, + "learning_rate": 8.906390391491704e-05, + "loss": 0.7967, + "mean_token_accuracy": 0.7652240335941315, + "num_tokens": 140175616.0, + "step": 60500 + }, + { + "epoch": 0.554781333088842, + "learning_rate": 8.904556706702119e-05, + "loss": 0.7376, + "mean_token_accuracy": 0.7764686822891236, + "num_tokens": 140200453.0, + "step": 60510 + }, + { + "epoch": 0.5548730173283213, + "learning_rate": 8.902723021912534e-05, + "loss": 0.7359, + "mean_token_accuracy": 0.7744403719902039, + "num_tokens": 140224911.0, + "step": 60520 + }, + { + "epoch": 0.5549647015678005, + "learning_rate": 8.900889337122949e-05, + "loss": 0.7671, + "mean_token_accuracy": 0.7694585621356964, + "num_tokens": 140250349.0, + "step": 60530 + }, + { + "epoch": 0.5550563858072798, + "learning_rate": 8.899055652333364e-05, + "loss": 0.7471, + "mean_token_accuracy": 0.7733817458152771, + "num_tokens": 140275980.0, + "step": 60540 + }, + { + "epoch": 0.5551480700467589, + "learning_rate": 8.89722196754378e-05, + "loss": 0.7971, + "mean_token_accuracy": 0.7652704894542695, + "num_tokens": 140299793.0, + "step": 60550 + }, + { + "epoch": 0.5552397542862382, + "learning_rate": 8.895388282754195e-05, + "loss": 0.7787, + "mean_token_accuracy": 0.7674022853374481, + "num_tokens": 140323896.0, + "step": 60560 + }, + { + "epoch": 0.5553314385257174, + "learning_rate": 8.893554597964611e-05, + "loss": 0.7441, + "mean_token_accuracy": 0.7775610744953155, + "num_tokens": 140348789.0, + "step": 60570 + }, + { + "epoch": 0.5554231227651967, + "learning_rate": 8.891720913175025e-05, + "loss": 0.7536, + "mean_token_accuracy": 0.7698719739913941, + "num_tokens": 140373299.0, + "step": 60580 + }, + { + "epoch": 0.5555148070046759, + "learning_rate": 8.88988722838544e-05, + "loss": 0.7086, + "mean_token_accuracy": 0.7829937219619751, + "num_tokens": 140398560.0, + "step": 60590 + }, + { + "epoch": 0.5556064912441552, + "learning_rate": 8.888053543595857e-05, + "loss": 0.7261, + "mean_token_accuracy": 0.7843235313892365, + "num_tokens": 140424358.0, + "step": 60600 + }, + { + "epoch": 0.5556981754836343, + "learning_rate": 8.886219858806272e-05, + "loss": 0.8054, + "mean_token_accuracy": 0.7546370446681976, + "num_tokens": 140447908.0, + "step": 60610 + }, + { + "epoch": 0.5557898597231136, + "learning_rate": 8.884386174016687e-05, + "loss": 0.7462, + "mean_token_accuracy": 0.7767966389656067, + "num_tokens": 140472309.0, + "step": 60620 + }, + { + "epoch": 0.5558815439625928, + "learning_rate": 8.882552489227102e-05, + "loss": 0.7348, + "mean_token_accuracy": 0.7720439910888672, + "num_tokens": 140498085.0, + "step": 60630 + }, + { + "epoch": 0.5559732282020721, + "learning_rate": 8.880718804437517e-05, + "loss": 0.7322, + "mean_token_accuracy": 0.7770056009292603, + "num_tokens": 140522371.0, + "step": 60640 + }, + { + "epoch": 0.5560649124415513, + "learning_rate": 8.878885119647933e-05, + "loss": 0.7247, + "mean_token_accuracy": 0.7749279797077179, + "num_tokens": 140546948.0, + "step": 60650 + }, + { + "epoch": 0.5561565966810306, + "learning_rate": 8.877051434858348e-05, + "loss": 0.7111, + "mean_token_accuracy": 0.778215354681015, + "num_tokens": 140572536.0, + "step": 60660 + }, + { + "epoch": 0.5562482809205098, + "learning_rate": 8.875217750068764e-05, + "loss": 0.744, + "mean_token_accuracy": 0.7755861580371857, + "num_tokens": 140596979.0, + "step": 60670 + }, + { + "epoch": 0.556339965159989, + "learning_rate": 8.873384065279178e-05, + "loss": 0.7289, + "mean_token_accuracy": 0.7835552096366882, + "num_tokens": 140621150.0, + "step": 60680 + }, + { + "epoch": 0.5564316493994682, + "learning_rate": 8.871550380489593e-05, + "loss": 0.7297, + "mean_token_accuracy": 0.7749859631061554, + "num_tokens": 140645648.0, + "step": 60690 + }, + { + "epoch": 0.5565233336389475, + "learning_rate": 8.86971669570001e-05, + "loss": 0.7374, + "mean_token_accuracy": 0.7716366291046143, + "num_tokens": 140670477.0, + "step": 60700 + }, + { + "epoch": 0.5566150178784267, + "learning_rate": 8.867883010910425e-05, + "loss": 0.7237, + "mean_token_accuracy": 0.7810007274150849, + "num_tokens": 140695695.0, + "step": 60710 + }, + { + "epoch": 0.556706702117906, + "learning_rate": 8.86604932612084e-05, + "loss": 0.7525, + "mean_token_accuracy": 0.7683439433574677, + "num_tokens": 140720847.0, + "step": 60720 + }, + { + "epoch": 0.5567983863573852, + "learning_rate": 8.864215641331256e-05, + "loss": 0.7931, + "mean_token_accuracy": 0.7599188685417175, + "num_tokens": 140745014.0, + "step": 60730 + }, + { + "epoch": 0.5568900705968644, + "learning_rate": 8.862381956541671e-05, + "loss": 0.7312, + "mean_token_accuracy": 0.7761836469173431, + "num_tokens": 140769222.0, + "step": 60740 + }, + { + "epoch": 0.5569817548363436, + "learning_rate": 8.860548271752086e-05, + "loss": 0.6983, + "mean_token_accuracy": 0.7895478844642639, + "num_tokens": 140793364.0, + "step": 60750 + }, + { + "epoch": 0.5570734390758229, + "learning_rate": 8.858714586962502e-05, + "loss": 0.7291, + "mean_token_accuracy": 0.7726792871952057, + "num_tokens": 140817259.0, + "step": 60760 + }, + { + "epoch": 0.5571651233153021, + "learning_rate": 8.856880902172918e-05, + "loss": 0.7553, + "mean_token_accuracy": 0.7737743556499481, + "num_tokens": 140842288.0, + "step": 60770 + }, + { + "epoch": 0.5572568075547814, + "learning_rate": 8.855047217383331e-05, + "loss": 0.7161, + "mean_token_accuracy": 0.7794773995876312, + "num_tokens": 140866603.0, + "step": 60780 + }, + { + "epoch": 0.5573484917942606, + "learning_rate": 8.853213532593747e-05, + "loss": 0.7478, + "mean_token_accuracy": 0.7692714989185333, + "num_tokens": 140891440.0, + "step": 60790 + }, + { + "epoch": 0.5574401760337399, + "learning_rate": 8.851379847804163e-05, + "loss": 0.7435, + "mean_token_accuracy": 0.7763656795024871, + "num_tokens": 140916817.0, + "step": 60800 + }, + { + "epoch": 0.557531860273219, + "learning_rate": 8.849546163014578e-05, + "loss": 0.7549, + "mean_token_accuracy": 0.7707635164260864, + "num_tokens": 140941500.0, + "step": 60810 + }, + { + "epoch": 0.5576235445126982, + "learning_rate": 8.847712478224994e-05, + "loss": 0.726, + "mean_token_accuracy": 0.7727028369903565, + "num_tokens": 140966174.0, + "step": 60820 + }, + { + "epoch": 0.5577152287521775, + "learning_rate": 8.845878793435409e-05, + "loss": 0.6845, + "mean_token_accuracy": 0.7924252450466156, + "num_tokens": 140991763.0, + "step": 60830 + }, + { + "epoch": 0.5578069129916567, + "learning_rate": 8.844045108645824e-05, + "loss": 0.6939, + "mean_token_accuracy": 0.7871376514434815, + "num_tokens": 141017056.0, + "step": 60840 + }, + { + "epoch": 0.557898597231136, + "learning_rate": 8.842211423856239e-05, + "loss": 0.7453, + "mean_token_accuracy": 0.7725602924823761, + "num_tokens": 141042096.0, + "step": 60850 + }, + { + "epoch": 0.5579902814706152, + "learning_rate": 8.840377739066656e-05, + "loss": 0.7449, + "mean_token_accuracy": 0.7751950621604919, + "num_tokens": 141066226.0, + "step": 60860 + }, + { + "epoch": 0.5580819657100944, + "learning_rate": 8.838544054277071e-05, + "loss": 0.7084, + "mean_token_accuracy": 0.7858047962188721, + "num_tokens": 141090053.0, + "step": 60870 + }, + { + "epoch": 0.5581736499495736, + "learning_rate": 8.836710369487485e-05, + "loss": 0.7624, + "mean_token_accuracy": 0.7668496429920196, + "num_tokens": 141114729.0, + "step": 60880 + }, + { + "epoch": 0.5582653341890529, + "learning_rate": 8.8348766846979e-05, + "loss": 0.7123, + "mean_token_accuracy": 0.7860641777515411, + "num_tokens": 141140151.0, + "step": 60890 + }, + { + "epoch": 0.5583570184285321, + "learning_rate": 8.833042999908316e-05, + "loss": 0.738, + "mean_token_accuracy": 0.7760488331317902, + "num_tokens": 141165360.0, + "step": 60900 + }, + { + "epoch": 0.5584487026680114, + "learning_rate": 8.831209315118732e-05, + "loss": 0.7782, + "mean_token_accuracy": 0.7627298414707184, + "num_tokens": 141189187.0, + "step": 60910 + }, + { + "epoch": 0.5585403869074906, + "learning_rate": 8.829375630329147e-05, + "loss": 0.7083, + "mean_token_accuracy": 0.7848528623580933, + "num_tokens": 141213872.0, + "step": 60920 + }, + { + "epoch": 0.5586320711469699, + "learning_rate": 8.827541945539562e-05, + "loss": 0.7791, + "mean_token_accuracy": 0.7646727144718171, + "num_tokens": 141238522.0, + "step": 60930 + }, + { + "epoch": 0.558723755386449, + "learning_rate": 8.825708260749977e-05, + "loss": 0.734, + "mean_token_accuracy": 0.7805249214172363, + "num_tokens": 141263361.0, + "step": 60940 + }, + { + "epoch": 0.5588154396259283, + "learning_rate": 8.823874575960392e-05, + "loss": 0.7259, + "mean_token_accuracy": 0.7775725722312927, + "num_tokens": 141287671.0, + "step": 60950 + }, + { + "epoch": 0.5589071238654075, + "learning_rate": 8.822040891170809e-05, + "loss": 0.7474, + "mean_token_accuracy": 0.7717169404029847, + "num_tokens": 141311997.0, + "step": 60960 + }, + { + "epoch": 0.5589988081048868, + "learning_rate": 8.820207206381224e-05, + "loss": 0.6986, + "mean_token_accuracy": 0.7866757810115814, + "num_tokens": 141336475.0, + "step": 60970 + }, + { + "epoch": 0.559090492344366, + "learning_rate": 8.818373521591638e-05, + "loss": 0.7521, + "mean_token_accuracy": 0.7763409078121185, + "num_tokens": 141361489.0, + "step": 60980 + }, + { + "epoch": 0.5591821765838453, + "learning_rate": 8.816539836802054e-05, + "loss": 0.7253, + "mean_token_accuracy": 0.7778802812099457, + "num_tokens": 141386479.0, + "step": 60990 + }, + { + "epoch": 0.5592738608233244, + "learning_rate": 8.81470615201247e-05, + "loss": 0.764, + "mean_token_accuracy": 0.771779590845108, + "num_tokens": 141411513.0, + "step": 61000 + }, + { + "epoch": 0.5593655450628037, + "learning_rate": 8.812872467222885e-05, + "loss": 0.7154, + "mean_token_accuracy": 0.7872254371643066, + "num_tokens": 141436243.0, + "step": 61010 + }, + { + "epoch": 0.5594572293022829, + "learning_rate": 8.8110387824333e-05, + "loss": 0.703, + "mean_token_accuracy": 0.7816587388515472, + "num_tokens": 141461458.0, + "step": 61020 + }, + { + "epoch": 0.5595489135417622, + "learning_rate": 8.809205097643715e-05, + "loss": 0.772, + "mean_token_accuracy": 0.7643976628780365, + "num_tokens": 141485690.0, + "step": 61030 + }, + { + "epoch": 0.5596405977812414, + "learning_rate": 8.80737141285413e-05, + "loss": 0.7591, + "mean_token_accuracy": 0.7725388169288635, + "num_tokens": 141510135.0, + "step": 61040 + }, + { + "epoch": 0.5597322820207207, + "learning_rate": 8.805537728064546e-05, + "loss": 0.7009, + "mean_token_accuracy": 0.7810416221618652, + "num_tokens": 141535028.0, + "step": 61050 + }, + { + "epoch": 0.5598239662601999, + "learning_rate": 8.803704043274962e-05, + "loss": 0.7663, + "mean_token_accuracy": 0.7759714722633362, + "num_tokens": 141559996.0, + "step": 61060 + }, + { + "epoch": 0.5599156504996791, + "learning_rate": 8.801870358485377e-05, + "loss": 0.6954, + "mean_token_accuracy": 0.7873109877109528, + "num_tokens": 141584710.0, + "step": 61070 + }, + { + "epoch": 0.5600073347391583, + "learning_rate": 8.800036673695791e-05, + "loss": 0.7179, + "mean_token_accuracy": 0.781514710187912, + "num_tokens": 141609681.0, + "step": 61080 + }, + { + "epoch": 0.5600990189786376, + "learning_rate": 8.798202988906208e-05, + "loss": 0.742, + "mean_token_accuracy": 0.7753199696540832, + "num_tokens": 141633912.0, + "step": 61090 + }, + { + "epoch": 0.5601907032181168, + "learning_rate": 8.796369304116623e-05, + "loss": 0.7486, + "mean_token_accuracy": 0.7787988245487213, + "num_tokens": 141658106.0, + "step": 61100 + }, + { + "epoch": 0.5602823874575961, + "learning_rate": 8.794535619327038e-05, + "loss": 0.7315, + "mean_token_accuracy": 0.7788116216659546, + "num_tokens": 141682789.0, + "step": 61110 + }, + { + "epoch": 0.5603740716970753, + "learning_rate": 8.792701934537455e-05, + "loss": 0.7377, + "mean_token_accuracy": 0.7705783665180206, + "num_tokens": 141708360.0, + "step": 61120 + }, + { + "epoch": 0.5604657559365545, + "learning_rate": 8.790868249747868e-05, + "loss": 0.7175, + "mean_token_accuracy": 0.788539856672287, + "num_tokens": 141733260.0, + "step": 61130 + }, + { + "epoch": 0.5605574401760337, + "learning_rate": 8.789034564958284e-05, + "loss": 0.7515, + "mean_token_accuracy": 0.7713378965854645, + "num_tokens": 141757752.0, + "step": 61140 + }, + { + "epoch": 0.560649124415513, + "learning_rate": 8.787200880168699e-05, + "loss": 0.7288, + "mean_token_accuracy": 0.7729795396327972, + "num_tokens": 141782487.0, + "step": 61150 + }, + { + "epoch": 0.5607408086549922, + "learning_rate": 8.785367195379115e-05, + "loss": 0.7418, + "mean_token_accuracy": 0.774861353635788, + "num_tokens": 141807675.0, + "step": 61160 + }, + { + "epoch": 0.5608324928944715, + "learning_rate": 8.78353351058953e-05, + "loss": 0.672, + "mean_token_accuracy": 0.7917165219783783, + "num_tokens": 141832580.0, + "step": 61170 + }, + { + "epoch": 0.5609241771339507, + "learning_rate": 8.781699825799944e-05, + "loss": 0.7139, + "mean_token_accuracy": 0.7839303493499756, + "num_tokens": 141857734.0, + "step": 61180 + }, + { + "epoch": 0.56101586137343, + "learning_rate": 8.779866141010361e-05, + "loss": 0.7126, + "mean_token_accuracy": 0.7835335195064544, + "num_tokens": 141882208.0, + "step": 61190 + }, + { + "epoch": 0.5611075456129091, + "learning_rate": 8.778032456220776e-05, + "loss": 0.724, + "mean_token_accuracy": 0.783144611120224, + "num_tokens": 141906932.0, + "step": 61200 + }, + { + "epoch": 0.5611992298523883, + "learning_rate": 8.776198771431191e-05, + "loss": 0.7332, + "mean_token_accuracy": 0.7786126017570496, + "num_tokens": 141931412.0, + "step": 61210 + }, + { + "epoch": 0.5612909140918676, + "learning_rate": 8.774365086641608e-05, + "loss": 0.7439, + "mean_token_accuracy": 0.7730164468288422, + "num_tokens": 141956073.0, + "step": 61220 + }, + { + "epoch": 0.5613825983313468, + "learning_rate": 8.772531401852022e-05, + "loss": 0.7244, + "mean_token_accuracy": 0.7842257678508758, + "num_tokens": 141981534.0, + "step": 61230 + }, + { + "epoch": 0.5614742825708261, + "learning_rate": 8.770697717062437e-05, + "loss": 0.7428, + "mean_token_accuracy": 0.7746395111083985, + "num_tokens": 142005366.0, + "step": 61240 + }, + { + "epoch": 0.5615659668103054, + "learning_rate": 8.768864032272853e-05, + "loss": 0.7043, + "mean_token_accuracy": 0.7825834572315216, + "num_tokens": 142031163.0, + "step": 61250 + }, + { + "epoch": 0.5616576510497845, + "learning_rate": 8.767030347483269e-05, + "loss": 0.7326, + "mean_token_accuracy": 0.7777396857738494, + "num_tokens": 142056016.0, + "step": 61260 + }, + { + "epoch": 0.5617493352892637, + "learning_rate": 8.765196662693684e-05, + "loss": 0.7161, + "mean_token_accuracy": 0.7755993962287903, + "num_tokens": 142080906.0, + "step": 61270 + }, + { + "epoch": 0.561841019528743, + "learning_rate": 8.763362977904098e-05, + "loss": 0.7509, + "mean_token_accuracy": 0.7720266282558441, + "num_tokens": 142105483.0, + "step": 61280 + }, + { + "epoch": 0.5619327037682222, + "learning_rate": 8.761529293114514e-05, + "loss": 0.7531, + "mean_token_accuracy": 0.7713659226894378, + "num_tokens": 142129440.0, + "step": 61290 + }, + { + "epoch": 0.5620243880077015, + "learning_rate": 8.759695608324929e-05, + "loss": 0.7376, + "mean_token_accuracy": 0.7746829330921173, + "num_tokens": 142154420.0, + "step": 61300 + }, + { + "epoch": 0.5621160722471807, + "learning_rate": 8.757861923535344e-05, + "loss": 0.7565, + "mean_token_accuracy": 0.7759364008903503, + "num_tokens": 142179364.0, + "step": 61310 + }, + { + "epoch": 0.56220775648666, + "learning_rate": 8.756028238745761e-05, + "loss": 0.7467, + "mean_token_accuracy": 0.772876912355423, + "num_tokens": 142203813.0, + "step": 61320 + }, + { + "epoch": 0.5622994407261391, + "learning_rate": 8.754194553956175e-05, + "loss": 0.7143, + "mean_token_accuracy": 0.7848659813404083, + "num_tokens": 142229131.0, + "step": 61330 + }, + { + "epoch": 0.5623911249656184, + "learning_rate": 8.75236086916659e-05, + "loss": 0.7897, + "mean_token_accuracy": 0.7600663006305695, + "num_tokens": 142253859.0, + "step": 61340 + }, + { + "epoch": 0.5624828092050976, + "learning_rate": 8.750527184377007e-05, + "loss": 0.7186, + "mean_token_accuracy": 0.7817135035991669, + "num_tokens": 142279014.0, + "step": 61350 + }, + { + "epoch": 0.5625744934445769, + "learning_rate": 8.748693499587422e-05, + "loss": 0.7369, + "mean_token_accuracy": 0.7738412320613861, + "num_tokens": 142304369.0, + "step": 61360 + }, + { + "epoch": 0.5626661776840561, + "learning_rate": 8.746859814797837e-05, + "loss": 0.7277, + "mean_token_accuracy": 0.7809462487697602, + "num_tokens": 142329310.0, + "step": 61370 + }, + { + "epoch": 0.5627578619235354, + "learning_rate": 8.745026130008252e-05, + "loss": 0.7384, + "mean_token_accuracy": 0.7787182092666626, + "num_tokens": 142354353.0, + "step": 61380 + }, + { + "epoch": 0.5628495461630145, + "learning_rate": 8.743192445218667e-05, + "loss": 0.7509, + "mean_token_accuracy": 0.7639503538608551, + "num_tokens": 142378367.0, + "step": 61390 + }, + { + "epoch": 0.5629412304024938, + "learning_rate": 8.741358760429083e-05, + "loss": 0.729, + "mean_token_accuracy": 0.7805909156799317, + "num_tokens": 142403374.0, + "step": 61400 + }, + { + "epoch": 0.563032914641973, + "learning_rate": 8.739525075639498e-05, + "loss": 0.779, + "mean_token_accuracy": 0.765592074394226, + "num_tokens": 142428627.0, + "step": 61410 + }, + { + "epoch": 0.5631245988814523, + "learning_rate": 8.737691390849914e-05, + "loss": 0.7701, + "mean_token_accuracy": 0.7750620067119598, + "num_tokens": 142453343.0, + "step": 61420 + }, + { + "epoch": 0.5632162831209315, + "learning_rate": 8.735857706060328e-05, + "loss": 0.7202, + "mean_token_accuracy": 0.7815834820270539, + "num_tokens": 142478190.0, + "step": 61430 + }, + { + "epoch": 0.5633079673604108, + "learning_rate": 8.734024021270743e-05, + "loss": 0.7378, + "mean_token_accuracy": 0.7742599308490753, + "num_tokens": 142504276.0, + "step": 61440 + }, + { + "epoch": 0.56339965159989, + "learning_rate": 8.73219033648116e-05, + "loss": 0.7224, + "mean_token_accuracy": 0.7844827890396118, + "num_tokens": 142529124.0, + "step": 61450 + }, + { + "epoch": 0.5634913358393692, + "learning_rate": 8.730356651691575e-05, + "loss": 0.717, + "mean_token_accuracy": 0.7813876330852508, + "num_tokens": 142553543.0, + "step": 61460 + }, + { + "epoch": 0.5635830200788484, + "learning_rate": 8.72852296690199e-05, + "loss": 0.7452, + "mean_token_accuracy": 0.773801612854004, + "num_tokens": 142579118.0, + "step": 61470 + }, + { + "epoch": 0.5636747043183277, + "learning_rate": 8.726689282112405e-05, + "loss": 0.7275, + "mean_token_accuracy": 0.7764965236186981, + "num_tokens": 142603774.0, + "step": 61480 + }, + { + "epoch": 0.5637663885578069, + "learning_rate": 8.72485559732282e-05, + "loss": 0.7466, + "mean_token_accuracy": 0.7742263793945312, + "num_tokens": 142629028.0, + "step": 61490 + }, + { + "epoch": 0.5638580727972862, + "learning_rate": 8.723021912533236e-05, + "loss": 0.7397, + "mean_token_accuracy": 0.7819108486175537, + "num_tokens": 142654163.0, + "step": 61500 + }, + { + "epoch": 0.5639497570367654, + "learning_rate": 8.721188227743651e-05, + "loss": 0.7516, + "mean_token_accuracy": 0.772611802816391, + "num_tokens": 142678161.0, + "step": 61510 + }, + { + "epoch": 0.5640414412762446, + "learning_rate": 8.719354542954067e-05, + "loss": 0.7223, + "mean_token_accuracy": 0.7816067576408386, + "num_tokens": 142702549.0, + "step": 61520 + }, + { + "epoch": 0.5641331255157238, + "learning_rate": 8.717520858164481e-05, + "loss": 0.7228, + "mean_token_accuracy": 0.7792167603969574, + "num_tokens": 142728113.0, + "step": 61530 + }, + { + "epoch": 0.5642248097552031, + "learning_rate": 8.715687173374896e-05, + "loss": 0.7361, + "mean_token_accuracy": 0.780789577960968, + "num_tokens": 142753801.0, + "step": 61540 + }, + { + "epoch": 0.5643164939946823, + "learning_rate": 8.713853488585313e-05, + "loss": 0.7092, + "mean_token_accuracy": 0.7850222945213318, + "num_tokens": 142778988.0, + "step": 61550 + }, + { + "epoch": 0.5644081782341616, + "learning_rate": 8.712019803795728e-05, + "loss": 0.7199, + "mean_token_accuracy": 0.7778768181800843, + "num_tokens": 142804062.0, + "step": 61560 + }, + { + "epoch": 0.5644998624736408, + "learning_rate": 8.710186119006143e-05, + "loss": 0.7766, + "mean_token_accuracy": 0.7678954005241394, + "num_tokens": 142828820.0, + "step": 61570 + }, + { + "epoch": 0.5645915467131201, + "learning_rate": 8.708352434216559e-05, + "loss": 0.7465, + "mean_token_accuracy": 0.7716767072677613, + "num_tokens": 142853280.0, + "step": 61580 + }, + { + "epoch": 0.5646832309525992, + "learning_rate": 8.706518749426974e-05, + "loss": 0.7153, + "mean_token_accuracy": 0.7797940015792847, + "num_tokens": 142877595.0, + "step": 61590 + }, + { + "epoch": 0.5647749151920785, + "learning_rate": 8.704685064637389e-05, + "loss": 0.7345, + "mean_token_accuracy": 0.7749894678592681, + "num_tokens": 142902572.0, + "step": 61600 + }, + { + "epoch": 0.5648665994315577, + "learning_rate": 8.702851379847805e-05, + "loss": 0.7219, + "mean_token_accuracy": 0.7763688921928406, + "num_tokens": 142927733.0, + "step": 61610 + }, + { + "epoch": 0.564958283671037, + "learning_rate": 8.701017695058221e-05, + "loss": 0.7349, + "mean_token_accuracy": 0.7736750721931458, + "num_tokens": 142952978.0, + "step": 61620 + }, + { + "epoch": 0.5650499679105162, + "learning_rate": 8.699184010268635e-05, + "loss": 0.7156, + "mean_token_accuracy": 0.786289119720459, + "num_tokens": 142977716.0, + "step": 61630 + }, + { + "epoch": 0.5651416521499955, + "learning_rate": 8.69735032547905e-05, + "loss": 0.7285, + "mean_token_accuracy": 0.7771040678024292, + "num_tokens": 143002377.0, + "step": 61640 + }, + { + "epoch": 0.5652333363894746, + "learning_rate": 8.695516640689466e-05, + "loss": 0.7564, + "mean_token_accuracy": 0.7740037858486175, + "num_tokens": 143027062.0, + "step": 61650 + }, + { + "epoch": 0.5653250206289538, + "learning_rate": 8.693682955899881e-05, + "loss": 0.6785, + "mean_token_accuracy": 0.7890504896640778, + "num_tokens": 143052356.0, + "step": 61660 + }, + { + "epoch": 0.5654167048684331, + "learning_rate": 8.691849271110297e-05, + "loss": 0.7515, + "mean_token_accuracy": 0.7712706089019775, + "num_tokens": 143077597.0, + "step": 61670 + }, + { + "epoch": 0.5655083891079123, + "learning_rate": 8.690015586320712e-05, + "loss": 0.7017, + "mean_token_accuracy": 0.7918259799480438, + "num_tokens": 143102384.0, + "step": 61680 + }, + { + "epoch": 0.5656000733473916, + "learning_rate": 8.688181901531127e-05, + "loss": 0.718, + "mean_token_accuracy": 0.7809239447116851, + "num_tokens": 143127265.0, + "step": 61690 + }, + { + "epoch": 0.5656917575868708, + "learning_rate": 8.686348216741542e-05, + "loss": 0.6947, + "mean_token_accuracy": 0.7870328426361084, + "num_tokens": 143152889.0, + "step": 61700 + }, + { + "epoch": 0.5657834418263501, + "learning_rate": 8.684514531951959e-05, + "loss": 0.7016, + "mean_token_accuracy": 0.7889711618423462, + "num_tokens": 143178063.0, + "step": 61710 + }, + { + "epoch": 0.5658751260658292, + "learning_rate": 8.682680847162374e-05, + "loss": 0.7462, + "mean_token_accuracy": 0.7709170818328858, + "num_tokens": 143203681.0, + "step": 61720 + }, + { + "epoch": 0.5659668103053085, + "learning_rate": 8.680847162372788e-05, + "loss": 0.7135, + "mean_token_accuracy": 0.786488926410675, + "num_tokens": 143229020.0, + "step": 61730 + }, + { + "epoch": 0.5660584945447877, + "learning_rate": 8.679013477583204e-05, + "loss": 0.7145, + "mean_token_accuracy": 0.7814090788364411, + "num_tokens": 143253751.0, + "step": 61740 + }, + { + "epoch": 0.566150178784267, + "learning_rate": 8.67717979279362e-05, + "loss": 0.6934, + "mean_token_accuracy": 0.7881740212440491, + "num_tokens": 143278772.0, + "step": 61750 + }, + { + "epoch": 0.5662418630237462, + "learning_rate": 8.675346108004035e-05, + "loss": 0.7345, + "mean_token_accuracy": 0.7782626450061798, + "num_tokens": 143303803.0, + "step": 61760 + }, + { + "epoch": 0.5663335472632255, + "learning_rate": 8.67351242321445e-05, + "loss": 0.696, + "mean_token_accuracy": 0.7860243439674377, + "num_tokens": 143328999.0, + "step": 61770 + }, + { + "epoch": 0.5664252315027047, + "learning_rate": 8.671678738424865e-05, + "loss": 0.7314, + "mean_token_accuracy": 0.7823576271533966, + "num_tokens": 143354398.0, + "step": 61780 + }, + { + "epoch": 0.5665169157421839, + "learning_rate": 8.66984505363528e-05, + "loss": 0.7147, + "mean_token_accuracy": 0.7784162044525147, + "num_tokens": 143378353.0, + "step": 61790 + }, + { + "epoch": 0.5666085999816631, + "learning_rate": 8.668011368845695e-05, + "loss": 0.7071, + "mean_token_accuracy": 0.7821170151233673, + "num_tokens": 143403959.0, + "step": 61800 + }, + { + "epoch": 0.5667002842211424, + "learning_rate": 8.666177684056112e-05, + "loss": 0.7434, + "mean_token_accuracy": 0.7774074018001557, + "num_tokens": 143429416.0, + "step": 61810 + }, + { + "epoch": 0.5667919684606216, + "learning_rate": 8.664343999266527e-05, + "loss": 0.7473, + "mean_token_accuracy": 0.7764745056629181, + "num_tokens": 143455050.0, + "step": 61820 + }, + { + "epoch": 0.5668836527001009, + "learning_rate": 8.662510314476941e-05, + "loss": 0.7254, + "mean_token_accuracy": 0.7757602453231811, + "num_tokens": 143480438.0, + "step": 61830 + }, + { + "epoch": 0.5669753369395801, + "learning_rate": 8.660676629687358e-05, + "loss": 0.7415, + "mean_token_accuracy": 0.7818674862384796, + "num_tokens": 143503868.0, + "step": 61840 + }, + { + "epoch": 0.5670670211790593, + "learning_rate": 8.658842944897773e-05, + "loss": 0.715, + "mean_token_accuracy": 0.7772590398788453, + "num_tokens": 143527856.0, + "step": 61850 + }, + { + "epoch": 0.5671587054185385, + "learning_rate": 8.657009260108188e-05, + "loss": 0.7384, + "mean_token_accuracy": 0.7781527757644653, + "num_tokens": 143552042.0, + "step": 61860 + }, + { + "epoch": 0.5672503896580178, + "learning_rate": 8.655175575318603e-05, + "loss": 0.7236, + "mean_token_accuracy": 0.7846739411354064, + "num_tokens": 143577375.0, + "step": 61870 + }, + { + "epoch": 0.567342073897497, + "learning_rate": 8.653341890529018e-05, + "loss": 0.7422, + "mean_token_accuracy": 0.7735691845417023, + "num_tokens": 143602524.0, + "step": 61880 + }, + { + "epoch": 0.5674337581369763, + "learning_rate": 8.651508205739433e-05, + "loss": 0.6834, + "mean_token_accuracy": 0.7884851515293121, + "num_tokens": 143627104.0, + "step": 61890 + }, + { + "epoch": 0.5675254423764555, + "learning_rate": 8.649674520949849e-05, + "loss": 0.7026, + "mean_token_accuracy": 0.7839809358119965, + "num_tokens": 143652664.0, + "step": 61900 + }, + { + "epoch": 0.5676171266159348, + "learning_rate": 8.647840836160265e-05, + "loss": 0.7315, + "mean_token_accuracy": 0.7812272548675537, + "num_tokens": 143677592.0, + "step": 61910 + }, + { + "epoch": 0.5677088108554139, + "learning_rate": 8.64600715137068e-05, + "loss": 0.7349, + "mean_token_accuracy": 0.7826238691806793, + "num_tokens": 143702338.0, + "step": 61920 + }, + { + "epoch": 0.5678004950948932, + "learning_rate": 8.644173466581094e-05, + "loss": 0.7132, + "mean_token_accuracy": 0.7844032406806946, + "num_tokens": 143727529.0, + "step": 61930 + }, + { + "epoch": 0.5678921793343724, + "learning_rate": 8.642339781791511e-05, + "loss": 0.7237, + "mean_token_accuracy": 0.7779807567596435, + "num_tokens": 143752375.0, + "step": 61940 + }, + { + "epoch": 0.5679838635738517, + "learning_rate": 8.640506097001926e-05, + "loss": 0.7173, + "mean_token_accuracy": 0.7860865294933319, + "num_tokens": 143776787.0, + "step": 61950 + }, + { + "epoch": 0.5680755478133309, + "learning_rate": 8.638672412212341e-05, + "loss": 0.755, + "mean_token_accuracy": 0.7720317900180816, + "num_tokens": 143801991.0, + "step": 61960 + }, + { + "epoch": 0.5681672320528102, + "learning_rate": 8.636838727422756e-05, + "loss": 0.7483, + "mean_token_accuracy": 0.7743564248085022, + "num_tokens": 143827644.0, + "step": 61970 + }, + { + "epoch": 0.5682589162922893, + "learning_rate": 8.635005042633171e-05, + "loss": 0.6841, + "mean_token_accuracy": 0.7905368804931641, + "num_tokens": 143851690.0, + "step": 61980 + }, + { + "epoch": 0.5683506005317686, + "learning_rate": 8.633171357843587e-05, + "loss": 0.7342, + "mean_token_accuracy": 0.7730114579200744, + "num_tokens": 143876895.0, + "step": 61990 + }, + { + "epoch": 0.5684422847712478, + "learning_rate": 8.631337673054003e-05, + "loss": 0.7443, + "mean_token_accuracy": 0.7728031933307647, + "num_tokens": 143902310.0, + "step": 62000 + }, + { + "epoch": 0.5685339690107271, + "learning_rate": 8.629503988264418e-05, + "loss": 0.7007, + "mean_token_accuracy": 0.7833173513412476, + "num_tokens": 143927201.0, + "step": 62010 + }, + { + "epoch": 0.5686256532502063, + "learning_rate": 8.627670303474834e-05, + "loss": 0.7427, + "mean_token_accuracy": 0.7764660060405731, + "num_tokens": 143951563.0, + "step": 62020 + }, + { + "epoch": 0.5687173374896856, + "learning_rate": 8.625836618685247e-05, + "loss": 0.6761, + "mean_token_accuracy": 0.7847448766231537, + "num_tokens": 143976856.0, + "step": 62030 + }, + { + "epoch": 0.5688090217291648, + "learning_rate": 8.624002933895664e-05, + "loss": 0.7023, + "mean_token_accuracy": 0.7841219067573547, + "num_tokens": 144001330.0, + "step": 62040 + }, + { + "epoch": 0.568900705968644, + "learning_rate": 8.622169249106079e-05, + "loss": 0.7559, + "mean_token_accuracy": 0.773005610704422, + "num_tokens": 144027144.0, + "step": 62050 + }, + { + "epoch": 0.5689923902081232, + "learning_rate": 8.620335564316494e-05, + "loss": 0.6943, + "mean_token_accuracy": 0.7877039730548858, + "num_tokens": 144052308.0, + "step": 62060 + }, + { + "epoch": 0.5690840744476025, + "learning_rate": 8.61850187952691e-05, + "loss": 0.7176, + "mean_token_accuracy": 0.78382129073143, + "num_tokens": 144077742.0, + "step": 62070 + }, + { + "epoch": 0.5691757586870817, + "learning_rate": 8.616668194737325e-05, + "loss": 0.7193, + "mean_token_accuracy": 0.7807154059410095, + "num_tokens": 144103004.0, + "step": 62080 + }, + { + "epoch": 0.569267442926561, + "learning_rate": 8.61483450994774e-05, + "loss": 0.7071, + "mean_token_accuracy": 0.7818564057350159, + "num_tokens": 144127832.0, + "step": 62090 + }, + { + "epoch": 0.5693591271660402, + "learning_rate": 8.613000825158156e-05, + "loss": 0.7316, + "mean_token_accuracy": 0.7813744127750397, + "num_tokens": 144152562.0, + "step": 62100 + }, + { + "epoch": 0.5694508114055193, + "learning_rate": 8.611167140368572e-05, + "loss": 0.7125, + "mean_token_accuracy": 0.7842976093292237, + "num_tokens": 144177810.0, + "step": 62110 + }, + { + "epoch": 0.5695424956449986, + "learning_rate": 8.609333455578987e-05, + "loss": 0.7142, + "mean_token_accuracy": 0.7869325280189514, + "num_tokens": 144202645.0, + "step": 62120 + }, + { + "epoch": 0.5696341798844778, + "learning_rate": 8.6074997707894e-05, + "loss": 0.6733, + "mean_token_accuracy": 0.7955866277217865, + "num_tokens": 144227971.0, + "step": 62130 + }, + { + "epoch": 0.5697258641239571, + "learning_rate": 8.605666085999817e-05, + "loss": 0.7257, + "mean_token_accuracy": 0.7834891974925995, + "num_tokens": 144252837.0, + "step": 62140 + }, + { + "epoch": 0.5698175483634363, + "learning_rate": 8.603832401210232e-05, + "loss": 0.7068, + "mean_token_accuracy": 0.7873168587684631, + "num_tokens": 144278083.0, + "step": 62150 + }, + { + "epoch": 0.5699092326029156, + "learning_rate": 8.601998716420648e-05, + "loss": 0.6749, + "mean_token_accuracy": 0.7899958074092865, + "num_tokens": 144302066.0, + "step": 62160 + }, + { + "epoch": 0.5700009168423948, + "learning_rate": 8.600165031631063e-05, + "loss": 0.7229, + "mean_token_accuracy": 0.7795552492141724, + "num_tokens": 144326831.0, + "step": 62170 + }, + { + "epoch": 0.570092601081874, + "learning_rate": 8.598331346841478e-05, + "loss": 0.7257, + "mean_token_accuracy": 0.7803704261779785, + "num_tokens": 144351891.0, + "step": 62180 + }, + { + "epoch": 0.5701842853213532, + "learning_rate": 8.596497662051893e-05, + "loss": 0.7318, + "mean_token_accuracy": 0.7827034533023834, + "num_tokens": 144377216.0, + "step": 62190 + }, + { + "epoch": 0.5702759695608325, + "learning_rate": 8.59466397726231e-05, + "loss": 0.7335, + "mean_token_accuracy": 0.7783604204654694, + "num_tokens": 144402222.0, + "step": 62200 + }, + { + "epoch": 0.5703676538003117, + "learning_rate": 8.592830292472725e-05, + "loss": 0.6947, + "mean_token_accuracy": 0.7828047335147857, + "num_tokens": 144427150.0, + "step": 62210 + }, + { + "epoch": 0.570459338039791, + "learning_rate": 8.59099660768314e-05, + "loss": 0.7695, + "mean_token_accuracy": 0.763064694404602, + "num_tokens": 144452635.0, + "step": 62220 + }, + { + "epoch": 0.5705510222792702, + "learning_rate": 8.589162922893555e-05, + "loss": 0.6883, + "mean_token_accuracy": 0.7895868837833404, + "num_tokens": 144477485.0, + "step": 62230 + }, + { + "epoch": 0.5706427065187494, + "learning_rate": 8.58732923810397e-05, + "loss": 0.7187, + "mean_token_accuracy": 0.7818442523479462, + "num_tokens": 144501435.0, + "step": 62240 + }, + { + "epoch": 0.5707343907582286, + "learning_rate": 8.585495553314386e-05, + "loss": 0.7464, + "mean_token_accuracy": 0.7730175495147705, + "num_tokens": 144526511.0, + "step": 62250 + }, + { + "epoch": 0.5708260749977079, + "learning_rate": 8.583661868524801e-05, + "loss": 0.6967, + "mean_token_accuracy": 0.7853508651256561, + "num_tokens": 144551349.0, + "step": 62260 + }, + { + "epoch": 0.5709177592371871, + "learning_rate": 8.581828183735216e-05, + "loss": 0.7486, + "mean_token_accuracy": 0.7731032490730285, + "num_tokens": 144576097.0, + "step": 62270 + }, + { + "epoch": 0.5710094434766664, + "learning_rate": 8.579994498945631e-05, + "loss": 0.737, + "mean_token_accuracy": 0.78244908452034, + "num_tokens": 144601027.0, + "step": 62280 + }, + { + "epoch": 0.5711011277161456, + "learning_rate": 8.578160814156046e-05, + "loss": 0.6968, + "mean_token_accuracy": 0.7845434546470642, + "num_tokens": 144626786.0, + "step": 62290 + }, + { + "epoch": 0.5711928119556249, + "learning_rate": 8.576327129366463e-05, + "loss": 0.6985, + "mean_token_accuracy": 0.7877167165279388, + "num_tokens": 144651979.0, + "step": 62300 + }, + { + "epoch": 0.571284496195104, + "learning_rate": 8.574493444576878e-05, + "loss": 0.7196, + "mean_token_accuracy": 0.7870518088340759, + "num_tokens": 144676752.0, + "step": 62310 + }, + { + "epoch": 0.5713761804345833, + "learning_rate": 8.572659759787293e-05, + "loss": 0.6851, + "mean_token_accuracy": 0.788501638174057, + "num_tokens": 144701565.0, + "step": 62320 + }, + { + "epoch": 0.5714678646740625, + "learning_rate": 8.570826074997708e-05, + "loss": 0.7642, + "mean_token_accuracy": 0.7776337265968323, + "num_tokens": 144726064.0, + "step": 62330 + }, + { + "epoch": 0.5715595489135418, + "learning_rate": 8.568992390208124e-05, + "loss": 0.7043, + "mean_token_accuracy": 0.7870524108409882, + "num_tokens": 144751769.0, + "step": 62340 + }, + { + "epoch": 0.571651233153021, + "learning_rate": 8.567158705418539e-05, + "loss": 0.7156, + "mean_token_accuracy": 0.7824094951152801, + "num_tokens": 144776972.0, + "step": 62350 + }, + { + "epoch": 0.5717429173925003, + "learning_rate": 8.565325020628955e-05, + "loss": 0.6874, + "mean_token_accuracy": 0.7920378804206848, + "num_tokens": 144802057.0, + "step": 62360 + }, + { + "epoch": 0.5718346016319794, + "learning_rate": 8.563491335839369e-05, + "loss": 0.7267, + "mean_token_accuracy": 0.7790842652320862, + "num_tokens": 144826664.0, + "step": 62370 + }, + { + "epoch": 0.5719262858714587, + "learning_rate": 8.561657651049784e-05, + "loss": 0.6857, + "mean_token_accuracy": 0.7862694978713989, + "num_tokens": 144851285.0, + "step": 62380 + }, + { + "epoch": 0.5720179701109379, + "learning_rate": 8.5598239662602e-05, + "loss": 0.7211, + "mean_token_accuracy": 0.7760497152805328, + "num_tokens": 144875440.0, + "step": 62390 + }, + { + "epoch": 0.5721096543504172, + "learning_rate": 8.557990281470616e-05, + "loss": 0.7187, + "mean_token_accuracy": 0.7806708574295044, + "num_tokens": 144900548.0, + "step": 62400 + }, + { + "epoch": 0.5722013385898964, + "learning_rate": 8.556156596681031e-05, + "loss": 0.6712, + "mean_token_accuracy": 0.7920472621917725, + "num_tokens": 144925434.0, + "step": 62410 + }, + { + "epoch": 0.5722930228293757, + "learning_rate": 8.554322911891446e-05, + "loss": 0.6869, + "mean_token_accuracy": 0.7868934035301208, + "num_tokens": 144951111.0, + "step": 62420 + }, + { + "epoch": 0.5723847070688549, + "learning_rate": 8.552489227101862e-05, + "loss": 0.6908, + "mean_token_accuracy": 0.7944657862186432, + "num_tokens": 144976139.0, + "step": 62430 + }, + { + "epoch": 0.572476391308334, + "learning_rate": 8.550655542312277e-05, + "loss": 0.7257, + "mean_token_accuracy": 0.7857164978981018, + "num_tokens": 145001543.0, + "step": 62440 + }, + { + "epoch": 0.5725680755478133, + "learning_rate": 8.548821857522692e-05, + "loss": 0.7243, + "mean_token_accuracy": 0.7788842976093292, + "num_tokens": 145026031.0, + "step": 62450 + }, + { + "epoch": 0.5726597597872926, + "learning_rate": 8.546988172733109e-05, + "loss": 0.6661, + "mean_token_accuracy": 0.7954781174659729, + "num_tokens": 145051023.0, + "step": 62460 + }, + { + "epoch": 0.5727514440267718, + "learning_rate": 8.545154487943522e-05, + "loss": 0.7176, + "mean_token_accuracy": 0.7817997395992279, + "num_tokens": 145076003.0, + "step": 62470 + }, + { + "epoch": 0.5728431282662511, + "learning_rate": 8.543320803153938e-05, + "loss": 0.749, + "mean_token_accuracy": 0.7724713504314422, + "num_tokens": 145100516.0, + "step": 62480 + }, + { + "epoch": 0.5729348125057303, + "learning_rate": 8.541487118364354e-05, + "loss": 0.7602, + "mean_token_accuracy": 0.7740296423435211, + "num_tokens": 145124950.0, + "step": 62490 + }, + { + "epoch": 0.5730264967452094, + "learning_rate": 8.539653433574769e-05, + "loss": 0.7428, + "mean_token_accuracy": 0.7710140287876129, + "num_tokens": 145149959.0, + "step": 62500 + }, + { + "epoch": 0.5731181809846887, + "learning_rate": 8.537819748785185e-05, + "loss": 0.7218, + "mean_token_accuracy": 0.7826135754585266, + "num_tokens": 145175594.0, + "step": 62510 + }, + { + "epoch": 0.573209865224168, + "learning_rate": 8.5359860639956e-05, + "loss": 0.689, + "mean_token_accuracy": 0.7823807060718536, + "num_tokens": 145200677.0, + "step": 62520 + }, + { + "epoch": 0.5733015494636472, + "learning_rate": 8.534152379206015e-05, + "loss": 0.7006, + "mean_token_accuracy": 0.7830764055252075, + "num_tokens": 145226189.0, + "step": 62530 + }, + { + "epoch": 0.5733932337031264, + "learning_rate": 8.53231869441643e-05, + "loss": 0.6916, + "mean_token_accuracy": 0.7884008705615997, + "num_tokens": 145250934.0, + "step": 62540 + }, + { + "epoch": 0.5734849179426057, + "learning_rate": 8.530485009626845e-05, + "loss": 0.7046, + "mean_token_accuracy": 0.7841234266757965, + "num_tokens": 145276332.0, + "step": 62550 + }, + { + "epoch": 0.573576602182085, + "learning_rate": 8.528651324837262e-05, + "loss": 0.7187, + "mean_token_accuracy": 0.7814329028129577, + "num_tokens": 145301519.0, + "step": 62560 + }, + { + "epoch": 0.5736682864215641, + "learning_rate": 8.526817640047676e-05, + "loss": 0.6778, + "mean_token_accuracy": 0.7847923219203949, + "num_tokens": 145325973.0, + "step": 62570 + }, + { + "epoch": 0.5737599706610433, + "learning_rate": 8.524983955258091e-05, + "loss": 0.7402, + "mean_token_accuracy": 0.7722189664840698, + "num_tokens": 145350919.0, + "step": 62580 + }, + { + "epoch": 0.5738516549005226, + "learning_rate": 8.523150270468507e-05, + "loss": 0.7065, + "mean_token_accuracy": 0.7750476062297821, + "num_tokens": 145375526.0, + "step": 62590 + }, + { + "epoch": 0.5739433391400018, + "learning_rate": 8.521316585678923e-05, + "loss": 0.6907, + "mean_token_accuracy": 0.782847660779953, + "num_tokens": 145399627.0, + "step": 62600 + }, + { + "epoch": 0.5740350233794811, + "learning_rate": 8.519482900889338e-05, + "loss": 0.7037, + "mean_token_accuracy": 0.7839486539363861, + "num_tokens": 145425176.0, + "step": 62610 + }, + { + "epoch": 0.5741267076189603, + "learning_rate": 8.517649216099753e-05, + "loss": 0.7247, + "mean_token_accuracy": 0.7804330945014953, + "num_tokens": 145450645.0, + "step": 62620 + }, + { + "epoch": 0.5742183918584395, + "learning_rate": 8.515815531310168e-05, + "loss": 0.7109, + "mean_token_accuracy": 0.7823985755443573, + "num_tokens": 145476768.0, + "step": 62630 + }, + { + "epoch": 0.5743100760979187, + "learning_rate": 8.513981846520583e-05, + "loss": 0.6857, + "mean_token_accuracy": 0.7896067500114441, + "num_tokens": 145502852.0, + "step": 62640 + }, + { + "epoch": 0.574401760337398, + "learning_rate": 8.512148161730998e-05, + "loss": 0.7065, + "mean_token_accuracy": 0.7823691308498383, + "num_tokens": 145527394.0, + "step": 62650 + }, + { + "epoch": 0.5744934445768772, + "learning_rate": 8.510314476941415e-05, + "loss": 0.727, + "mean_token_accuracy": 0.7741926550865174, + "num_tokens": 145552203.0, + "step": 62660 + }, + { + "epoch": 0.5745851288163565, + "learning_rate": 8.508480792151829e-05, + "loss": 0.69, + "mean_token_accuracy": 0.7900151491165162, + "num_tokens": 145577248.0, + "step": 62670 + }, + { + "epoch": 0.5746768130558357, + "learning_rate": 8.506647107362244e-05, + "loss": 0.7498, + "mean_token_accuracy": 0.7721031606197357, + "num_tokens": 145601599.0, + "step": 62680 + }, + { + "epoch": 0.574768497295315, + "learning_rate": 8.50481342257266e-05, + "loss": 0.7289, + "mean_token_accuracy": 0.7765326738357544, + "num_tokens": 145626537.0, + "step": 62690 + }, + { + "epoch": 0.5748601815347941, + "learning_rate": 8.502979737783076e-05, + "loss": 0.6884, + "mean_token_accuracy": 0.7924788475036622, + "num_tokens": 145651313.0, + "step": 62700 + }, + { + "epoch": 0.5749518657742734, + "learning_rate": 8.501146052993491e-05, + "loss": 0.7404, + "mean_token_accuracy": 0.7778672039508819, + "num_tokens": 145676890.0, + "step": 62710 + }, + { + "epoch": 0.5750435500137526, + "learning_rate": 8.499312368203906e-05, + "loss": 0.7038, + "mean_token_accuracy": 0.7784171462059021, + "num_tokens": 145701903.0, + "step": 62720 + }, + { + "epoch": 0.5751352342532319, + "learning_rate": 8.497478683414321e-05, + "loss": 0.7525, + "mean_token_accuracy": 0.7763013780117035, + "num_tokens": 145726327.0, + "step": 62730 + }, + { + "epoch": 0.5752269184927111, + "learning_rate": 8.495644998624737e-05, + "loss": 0.704, + "mean_token_accuracy": 0.7827533066272736, + "num_tokens": 145750743.0, + "step": 62740 + }, + { + "epoch": 0.5753186027321904, + "learning_rate": 8.493811313835152e-05, + "loss": 0.6647, + "mean_token_accuracy": 0.7939302027225494, + "num_tokens": 145776675.0, + "step": 62750 + }, + { + "epoch": 0.5754102869716695, + "learning_rate": 8.491977629045568e-05, + "loss": 0.7105, + "mean_token_accuracy": 0.7774204075336456, + "num_tokens": 145801596.0, + "step": 62760 + }, + { + "epoch": 0.5755019712111488, + "learning_rate": 8.490143944255982e-05, + "loss": 0.7042, + "mean_token_accuracy": 0.7891483724117279, + "num_tokens": 145826322.0, + "step": 62770 + }, + { + "epoch": 0.575593655450628, + "learning_rate": 8.488310259466397e-05, + "loss": 0.723, + "mean_token_accuracy": 0.7788620531558991, + "num_tokens": 145850580.0, + "step": 62780 + }, + { + "epoch": 0.5756853396901073, + "learning_rate": 8.486476574676814e-05, + "loss": 0.7541, + "mean_token_accuracy": 0.7751010417938232, + "num_tokens": 145875264.0, + "step": 62790 + }, + { + "epoch": 0.5757770239295865, + "learning_rate": 8.484642889887229e-05, + "loss": 0.748, + "mean_token_accuracy": 0.7660605370998382, + "num_tokens": 145899837.0, + "step": 62800 + }, + { + "epoch": 0.5758687081690658, + "learning_rate": 8.482809205097644e-05, + "loss": 0.7417, + "mean_token_accuracy": 0.7785557568073272, + "num_tokens": 145925004.0, + "step": 62810 + }, + { + "epoch": 0.575960392408545, + "learning_rate": 8.48097552030806e-05, + "loss": 0.7149, + "mean_token_accuracy": 0.7836163759231567, + "num_tokens": 145949662.0, + "step": 62820 + }, + { + "epoch": 0.5760520766480242, + "learning_rate": 8.479141835518475e-05, + "loss": 0.7236, + "mean_token_accuracy": 0.7806240856647492, + "num_tokens": 145973929.0, + "step": 62830 + }, + { + "epoch": 0.5761437608875034, + "learning_rate": 8.47730815072889e-05, + "loss": 0.744, + "mean_token_accuracy": 0.7761898577213288, + "num_tokens": 145999163.0, + "step": 62840 + }, + { + "epoch": 0.5762354451269827, + "learning_rate": 8.475474465939306e-05, + "loss": 0.7314, + "mean_token_accuracy": 0.7833976149559021, + "num_tokens": 146023082.0, + "step": 62850 + }, + { + "epoch": 0.5763271293664619, + "learning_rate": 8.473640781149721e-05, + "loss": 0.7209, + "mean_token_accuracy": 0.7851142287254333, + "num_tokens": 146048387.0, + "step": 62860 + }, + { + "epoch": 0.5764188136059412, + "learning_rate": 8.471807096360135e-05, + "loss": 0.7106, + "mean_token_accuracy": 0.782892906665802, + "num_tokens": 146073149.0, + "step": 62870 + }, + { + "epoch": 0.5765104978454204, + "learning_rate": 8.46997341157055e-05, + "loss": 0.714, + "mean_token_accuracy": 0.782066923379898, + "num_tokens": 146098305.0, + "step": 62880 + }, + { + "epoch": 0.5766021820848996, + "learning_rate": 8.468139726780967e-05, + "loss": 0.7266, + "mean_token_accuracy": 0.7785180389881134, + "num_tokens": 146123449.0, + "step": 62890 + }, + { + "epoch": 0.5766938663243788, + "learning_rate": 8.466306041991382e-05, + "loss": 0.7007, + "mean_token_accuracy": 0.7885490775108337, + "num_tokens": 146148490.0, + "step": 62900 + }, + { + "epoch": 0.576785550563858, + "learning_rate": 8.464472357201797e-05, + "loss": 0.6833, + "mean_token_accuracy": 0.788060975074768, + "num_tokens": 146174302.0, + "step": 62910 + }, + { + "epoch": 0.5768772348033373, + "learning_rate": 8.462638672412213e-05, + "loss": 0.7283, + "mean_token_accuracy": 0.7802075624465943, + "num_tokens": 146199530.0, + "step": 62920 + }, + { + "epoch": 0.5769689190428166, + "learning_rate": 8.460804987622628e-05, + "loss": 0.7556, + "mean_token_accuracy": 0.7705292403697968, + "num_tokens": 146224084.0, + "step": 62930 + }, + { + "epoch": 0.5770606032822958, + "learning_rate": 8.458971302833043e-05, + "loss": 0.7149, + "mean_token_accuracy": 0.7895412623882294, + "num_tokens": 146249644.0, + "step": 62940 + }, + { + "epoch": 0.577152287521775, + "learning_rate": 8.45713761804346e-05, + "loss": 0.7132, + "mean_token_accuracy": 0.7768167138099671, + "num_tokens": 146274811.0, + "step": 62950 + }, + { + "epoch": 0.5772439717612542, + "learning_rate": 8.455303933253875e-05, + "loss": 0.7043, + "mean_token_accuracy": 0.7833518564701081, + "num_tokens": 146299642.0, + "step": 62960 + }, + { + "epoch": 0.5773356560007334, + "learning_rate": 8.453470248464289e-05, + "loss": 0.6982, + "mean_token_accuracy": 0.78038569688797, + "num_tokens": 146324475.0, + "step": 62970 + }, + { + "epoch": 0.5774273402402127, + "learning_rate": 8.451636563674705e-05, + "loss": 0.706, + "mean_token_accuracy": 0.7805178344249726, + "num_tokens": 146349802.0, + "step": 62980 + }, + { + "epoch": 0.577519024479692, + "learning_rate": 8.44980287888512e-05, + "loss": 0.71, + "mean_token_accuracy": 0.7821848571300507, + "num_tokens": 146375188.0, + "step": 62990 + }, + { + "epoch": 0.5776107087191712, + "learning_rate": 8.447969194095535e-05, + "loss": 0.6671, + "mean_token_accuracy": 0.7967598080635071, + "num_tokens": 146400355.0, + "step": 63000 + }, + { + "epoch": 0.5777023929586504, + "learning_rate": 8.44613550930595e-05, + "loss": 0.7242, + "mean_token_accuracy": 0.7823297023773194, + "num_tokens": 146425836.0, + "step": 63010 + }, + { + "epoch": 0.5777940771981297, + "learning_rate": 8.444301824516366e-05, + "loss": 0.7146, + "mean_token_accuracy": 0.7926157057285309, + "num_tokens": 146451347.0, + "step": 63020 + }, + { + "epoch": 0.5778857614376088, + "learning_rate": 8.442468139726781e-05, + "loss": 0.6819, + "mean_token_accuracy": 0.7876127183437347, + "num_tokens": 146476917.0, + "step": 63030 + }, + { + "epoch": 0.5779774456770881, + "learning_rate": 8.440634454937196e-05, + "loss": 0.6825, + "mean_token_accuracy": 0.7935700833797454, + "num_tokens": 146501084.0, + "step": 63040 + }, + { + "epoch": 0.5780691299165673, + "learning_rate": 8.438800770147613e-05, + "loss": 0.7367, + "mean_token_accuracy": 0.7797764360904693, + "num_tokens": 146525975.0, + "step": 63050 + }, + { + "epoch": 0.5781608141560466, + "learning_rate": 8.436967085358028e-05, + "loss": 0.7, + "mean_token_accuracy": 0.7848899662494659, + "num_tokens": 146550896.0, + "step": 63060 + }, + { + "epoch": 0.5782524983955258, + "learning_rate": 8.435133400568442e-05, + "loss": 0.7035, + "mean_token_accuracy": 0.782321286201477, + "num_tokens": 146575765.0, + "step": 63070 + }, + { + "epoch": 0.5783441826350051, + "learning_rate": 8.433299715778858e-05, + "loss": 0.6938, + "mean_token_accuracy": 0.7841570675373077, + "num_tokens": 146600469.0, + "step": 63080 + }, + { + "epoch": 0.5784358668744842, + "learning_rate": 8.431466030989273e-05, + "loss": 0.7374, + "mean_token_accuracy": 0.7760751903057098, + "num_tokens": 146625258.0, + "step": 63090 + }, + { + "epoch": 0.5785275511139635, + "learning_rate": 8.429632346199689e-05, + "loss": 0.7013, + "mean_token_accuracy": 0.7842355668544769, + "num_tokens": 146649761.0, + "step": 63100 + }, + { + "epoch": 0.5786192353534427, + "learning_rate": 8.427798661410105e-05, + "loss": 0.7238, + "mean_token_accuracy": 0.7829664289951325, + "num_tokens": 146674748.0, + "step": 63110 + }, + { + "epoch": 0.578710919592922, + "learning_rate": 8.425964976620519e-05, + "loss": 0.6774, + "mean_token_accuracy": 0.7827253043651581, + "num_tokens": 146699220.0, + "step": 63120 + }, + { + "epoch": 0.5788026038324012, + "learning_rate": 8.424131291830934e-05, + "loss": 0.72, + "mean_token_accuracy": 0.7813050031661988, + "num_tokens": 146724612.0, + "step": 63130 + }, + { + "epoch": 0.5788942880718805, + "learning_rate": 8.42229760704135e-05, + "loss": 0.6826, + "mean_token_accuracy": 0.7871101498603821, + "num_tokens": 146749692.0, + "step": 63140 + }, + { + "epoch": 0.5789859723113597, + "learning_rate": 8.420463922251766e-05, + "loss": 0.7123, + "mean_token_accuracy": 0.7785660862922669, + "num_tokens": 146775434.0, + "step": 63150 + }, + { + "epoch": 0.5790776565508389, + "learning_rate": 8.418630237462181e-05, + "loss": 0.7478, + "mean_token_accuracy": 0.7785642802715301, + "num_tokens": 146799815.0, + "step": 63160 + }, + { + "epoch": 0.5791693407903181, + "learning_rate": 8.416796552672595e-05, + "loss": 0.7073, + "mean_token_accuracy": 0.7834717035293579, + "num_tokens": 146824601.0, + "step": 63170 + }, + { + "epoch": 0.5792610250297974, + "learning_rate": 8.414962867883012e-05, + "loss": 0.7155, + "mean_token_accuracy": 0.7826242804527282, + "num_tokens": 146849643.0, + "step": 63180 + }, + { + "epoch": 0.5793527092692766, + "learning_rate": 8.413129183093427e-05, + "loss": 0.6899, + "mean_token_accuracy": 0.7854468107223511, + "num_tokens": 146874481.0, + "step": 63190 + }, + { + "epoch": 0.5794443935087559, + "learning_rate": 8.411295498303842e-05, + "loss": 0.7339, + "mean_token_accuracy": 0.7812145709991455, + "num_tokens": 146899449.0, + "step": 63200 + }, + { + "epoch": 0.5795360777482351, + "learning_rate": 8.409461813514258e-05, + "loss": 0.7341, + "mean_token_accuracy": 0.779036957025528, + "num_tokens": 146924375.0, + "step": 63210 + }, + { + "epoch": 0.5796277619877143, + "learning_rate": 8.407628128724672e-05, + "loss": 0.6983, + "mean_token_accuracy": 0.7868231296539306, + "num_tokens": 146949424.0, + "step": 63220 + }, + { + "epoch": 0.5797194462271935, + "learning_rate": 8.405794443935087e-05, + "loss": 0.7047, + "mean_token_accuracy": 0.7889563262462616, + "num_tokens": 146973962.0, + "step": 63230 + }, + { + "epoch": 0.5798111304666728, + "learning_rate": 8.403960759145503e-05, + "loss": 0.6897, + "mean_token_accuracy": 0.7857967853546143, + "num_tokens": 147000350.0, + "step": 63240 + }, + { + "epoch": 0.579902814706152, + "learning_rate": 8.402127074355919e-05, + "loss": 0.6933, + "mean_token_accuracy": 0.7878205120563507, + "num_tokens": 147025143.0, + "step": 63250 + }, + { + "epoch": 0.5799944989456313, + "learning_rate": 8.400293389566334e-05, + "loss": 0.6937, + "mean_token_accuracy": 0.7922333836555481, + "num_tokens": 147050652.0, + "step": 63260 + }, + { + "epoch": 0.5800861831851105, + "learning_rate": 8.398459704776748e-05, + "loss": 0.6654, + "mean_token_accuracy": 0.7915775239467621, + "num_tokens": 147075218.0, + "step": 63270 + }, + { + "epoch": 0.5801778674245898, + "learning_rate": 8.396626019987165e-05, + "loss": 0.7133, + "mean_token_accuracy": 0.7793969333171844, + "num_tokens": 147099487.0, + "step": 63280 + }, + { + "epoch": 0.5802695516640689, + "learning_rate": 8.39479233519758e-05, + "loss": 0.67, + "mean_token_accuracy": 0.7927051484584808, + "num_tokens": 147125016.0, + "step": 63290 + }, + { + "epoch": 0.5803612359035482, + "learning_rate": 8.392958650407995e-05, + "loss": 0.6875, + "mean_token_accuracy": 0.78766930103302, + "num_tokens": 147149589.0, + "step": 63300 + }, + { + "epoch": 0.5804529201430274, + "learning_rate": 8.391124965618412e-05, + "loss": 0.6921, + "mean_token_accuracy": 0.7830041944980621, + "num_tokens": 147175048.0, + "step": 63310 + }, + { + "epoch": 0.5805446043825067, + "learning_rate": 8.389291280828825e-05, + "loss": 0.6755, + "mean_token_accuracy": 0.7940853297710418, + "num_tokens": 147199705.0, + "step": 63320 + }, + { + "epoch": 0.5806362886219859, + "learning_rate": 8.38745759603924e-05, + "loss": 0.7063, + "mean_token_accuracy": 0.7832659006118774, + "num_tokens": 147224235.0, + "step": 63330 + }, + { + "epoch": 0.5807279728614652, + "learning_rate": 8.385623911249657e-05, + "loss": 0.7003, + "mean_token_accuracy": 0.7910520970821381, + "num_tokens": 147248895.0, + "step": 63340 + }, + { + "epoch": 0.5808196571009443, + "learning_rate": 8.383790226460072e-05, + "loss": 0.7207, + "mean_token_accuracy": 0.7776158273220062, + "num_tokens": 147273937.0, + "step": 63350 + }, + { + "epoch": 0.5809113413404235, + "learning_rate": 8.381956541670488e-05, + "loss": 0.7092, + "mean_token_accuracy": 0.7816914856433869, + "num_tokens": 147298958.0, + "step": 63360 + }, + { + "epoch": 0.5810030255799028, + "learning_rate": 8.380122856880901e-05, + "loss": 0.7231, + "mean_token_accuracy": 0.7773494303226471, + "num_tokens": 147324865.0, + "step": 63370 + }, + { + "epoch": 0.581094709819382, + "learning_rate": 8.378289172091318e-05, + "loss": 0.7104, + "mean_token_accuracy": 0.7845860540866851, + "num_tokens": 147349623.0, + "step": 63380 + }, + { + "epoch": 0.5811863940588613, + "learning_rate": 8.376455487301733e-05, + "loss": 0.6921, + "mean_token_accuracy": 0.7901294887065887, + "num_tokens": 147374692.0, + "step": 63390 + }, + { + "epoch": 0.5812780782983406, + "learning_rate": 8.374621802512148e-05, + "loss": 0.7043, + "mean_token_accuracy": 0.7841442286968231, + "num_tokens": 147399633.0, + "step": 63400 + }, + { + "epoch": 0.5813697625378198, + "learning_rate": 8.372788117722565e-05, + "loss": 0.7403, + "mean_token_accuracy": 0.7764342486858368, + "num_tokens": 147424120.0, + "step": 63410 + }, + { + "epoch": 0.5814614467772989, + "learning_rate": 8.370954432932979e-05, + "loss": 0.716, + "mean_token_accuracy": 0.7835156202316285, + "num_tokens": 147448945.0, + "step": 63420 + }, + { + "epoch": 0.5815531310167782, + "learning_rate": 8.369120748143394e-05, + "loss": 0.7196, + "mean_token_accuracy": 0.7828741073608398, + "num_tokens": 147473602.0, + "step": 63430 + }, + { + "epoch": 0.5816448152562574, + "learning_rate": 8.36728706335381e-05, + "loss": 0.7073, + "mean_token_accuracy": 0.781675374507904, + "num_tokens": 147499587.0, + "step": 63440 + }, + { + "epoch": 0.5817364994957367, + "learning_rate": 8.365453378564226e-05, + "loss": 0.6948, + "mean_token_accuracy": 0.7856381833553314, + "num_tokens": 147525153.0, + "step": 63450 + }, + { + "epoch": 0.5818281837352159, + "learning_rate": 8.363619693774641e-05, + "loss": 0.709, + "mean_token_accuracy": 0.7836725771427154, + "num_tokens": 147550029.0, + "step": 63460 + }, + { + "epoch": 0.5819198679746952, + "learning_rate": 8.361786008985056e-05, + "loss": 0.6773, + "mean_token_accuracy": 0.7861979365348816, + "num_tokens": 147575441.0, + "step": 63470 + }, + { + "epoch": 0.5820115522141743, + "learning_rate": 8.359952324195471e-05, + "loss": 0.7022, + "mean_token_accuracy": 0.7886620819568634, + "num_tokens": 147600306.0, + "step": 63480 + }, + { + "epoch": 0.5821032364536536, + "learning_rate": 8.358118639405886e-05, + "loss": 0.7168, + "mean_token_accuracy": 0.7807242631912231, + "num_tokens": 147626353.0, + "step": 63490 + }, + { + "epoch": 0.5821949206931328, + "learning_rate": 8.356284954616302e-05, + "loss": 0.7286, + "mean_token_accuracy": 0.7790759265422821, + "num_tokens": 147651737.0, + "step": 63500 + }, + { + "epoch": 0.5822866049326121, + "learning_rate": 8.354451269826718e-05, + "loss": 0.6747, + "mean_token_accuracy": 0.7957220733165741, + "num_tokens": 147677184.0, + "step": 63510 + }, + { + "epoch": 0.5823782891720913, + "learning_rate": 8.352617585037132e-05, + "loss": 0.7245, + "mean_token_accuracy": 0.7769837498664856, + "num_tokens": 147702055.0, + "step": 63520 + }, + { + "epoch": 0.5824699734115706, + "learning_rate": 8.350783900247547e-05, + "loss": 0.74, + "mean_token_accuracy": 0.7733043849468231, + "num_tokens": 147727300.0, + "step": 63530 + }, + { + "epoch": 0.5825616576510498, + "learning_rate": 8.348950215457964e-05, + "loss": 0.7145, + "mean_token_accuracy": 0.7838710427284241, + "num_tokens": 147752010.0, + "step": 63540 + }, + { + "epoch": 0.582653341890529, + "learning_rate": 8.347116530668379e-05, + "loss": 0.7141, + "mean_token_accuracy": 0.7834075629711151, + "num_tokens": 147777880.0, + "step": 63550 + }, + { + "epoch": 0.5827450261300082, + "learning_rate": 8.345282845878794e-05, + "loss": 0.7124, + "mean_token_accuracy": 0.7875271916389466, + "num_tokens": 147802601.0, + "step": 63560 + }, + { + "epoch": 0.5828367103694875, + "learning_rate": 8.343449161089209e-05, + "loss": 0.6932, + "mean_token_accuracy": 0.7834922552108765, + "num_tokens": 147827355.0, + "step": 63570 + }, + { + "epoch": 0.5829283946089667, + "learning_rate": 8.341615476299624e-05, + "loss": 0.6954, + "mean_token_accuracy": 0.7847265064716339, + "num_tokens": 147851731.0, + "step": 63580 + }, + { + "epoch": 0.583020078848446, + "learning_rate": 8.33978179151004e-05, + "loss": 0.7342, + "mean_token_accuracy": 0.7769253015518188, + "num_tokens": 147876658.0, + "step": 63590 + }, + { + "epoch": 0.5831117630879252, + "learning_rate": 8.337948106720456e-05, + "loss": 0.7238, + "mean_token_accuracy": 0.7845895290374756, + "num_tokens": 147901547.0, + "step": 63600 + }, + { + "epoch": 0.5832034473274044, + "learning_rate": 8.336114421930871e-05, + "loss": 0.6858, + "mean_token_accuracy": 0.7881172716617584, + "num_tokens": 147927705.0, + "step": 63610 + }, + { + "epoch": 0.5832951315668836, + "learning_rate": 8.334280737141285e-05, + "loss": 0.6666, + "mean_token_accuracy": 0.7966143131256104, + "num_tokens": 147952671.0, + "step": 63620 + }, + { + "epoch": 0.5833868158063629, + "learning_rate": 8.3324470523517e-05, + "loss": 0.7122, + "mean_token_accuracy": 0.7883368730545044, + "num_tokens": 147977885.0, + "step": 63630 + }, + { + "epoch": 0.5834785000458421, + "learning_rate": 8.330613367562117e-05, + "loss": 0.7077, + "mean_token_accuracy": 0.7859804272651673, + "num_tokens": 148002936.0, + "step": 63640 + }, + { + "epoch": 0.5835701842853214, + "learning_rate": 8.328779682772532e-05, + "loss": 0.7072, + "mean_token_accuracy": 0.7861575543880462, + "num_tokens": 148028204.0, + "step": 63650 + }, + { + "epoch": 0.5836618685248006, + "learning_rate": 8.326945997982947e-05, + "loss": 0.7054, + "mean_token_accuracy": 0.7846588015556335, + "num_tokens": 148053259.0, + "step": 63660 + }, + { + "epoch": 0.5837535527642799, + "learning_rate": 8.325112313193362e-05, + "loss": 0.7082, + "mean_token_accuracy": 0.7851105570793152, + "num_tokens": 148077422.0, + "step": 63670 + }, + { + "epoch": 0.583845237003759, + "learning_rate": 8.323278628403778e-05, + "loss": 0.6979, + "mean_token_accuracy": 0.7855910003185272, + "num_tokens": 148102286.0, + "step": 63680 + }, + { + "epoch": 0.5839369212432383, + "learning_rate": 8.321444943614193e-05, + "loss": 0.6712, + "mean_token_accuracy": 0.7927249848842621, + "num_tokens": 148127324.0, + "step": 63690 + }, + { + "epoch": 0.5840286054827175, + "learning_rate": 8.31961125882461e-05, + "loss": 0.7181, + "mean_token_accuracy": 0.777326476573944, + "num_tokens": 148153074.0, + "step": 63700 + }, + { + "epoch": 0.5841202897221968, + "learning_rate": 8.317777574035025e-05, + "loss": 0.7108, + "mean_token_accuracy": 0.7857874810695649, + "num_tokens": 148178756.0, + "step": 63710 + }, + { + "epoch": 0.584211973961676, + "learning_rate": 8.315943889245438e-05, + "loss": 0.6583, + "mean_token_accuracy": 0.7944095849990844, + "num_tokens": 148204506.0, + "step": 63720 + }, + { + "epoch": 0.5843036582011553, + "learning_rate": 8.314110204455855e-05, + "loss": 0.7002, + "mean_token_accuracy": 0.7815732777118682, + "num_tokens": 148229454.0, + "step": 63730 + }, + { + "epoch": 0.5843953424406344, + "learning_rate": 8.31227651966627e-05, + "loss": 0.7299, + "mean_token_accuracy": 0.7798981308937073, + "num_tokens": 148254914.0, + "step": 63740 + }, + { + "epoch": 0.5844870266801137, + "learning_rate": 8.310442834876685e-05, + "loss": 0.6703, + "mean_token_accuracy": 0.7941282093524933, + "num_tokens": 148279383.0, + "step": 63750 + }, + { + "epoch": 0.5845787109195929, + "learning_rate": 8.3086091500871e-05, + "loss": 0.7003, + "mean_token_accuracy": 0.7854337990283966, + "num_tokens": 148304264.0, + "step": 63760 + }, + { + "epoch": 0.5846703951590722, + "learning_rate": 8.306775465297516e-05, + "loss": 0.734, + "mean_token_accuracy": 0.7756215274333954, + "num_tokens": 148329299.0, + "step": 63770 + }, + { + "epoch": 0.5847620793985514, + "learning_rate": 8.304941780507931e-05, + "loss": 0.6839, + "mean_token_accuracy": 0.7873515009880065, + "num_tokens": 148354155.0, + "step": 63780 + }, + { + "epoch": 0.5848537636380307, + "learning_rate": 8.303108095718346e-05, + "loss": 0.7098, + "mean_token_accuracy": 0.78629270195961, + "num_tokens": 148378644.0, + "step": 63790 + }, + { + "epoch": 0.5849454478775099, + "learning_rate": 8.301274410928763e-05, + "loss": 0.6794, + "mean_token_accuracy": 0.7919967710971832, + "num_tokens": 148403780.0, + "step": 63800 + }, + { + "epoch": 0.585037132116989, + "learning_rate": 8.299440726139178e-05, + "loss": 0.7437, + "mean_token_accuracy": 0.7779891729354859, + "num_tokens": 148428929.0, + "step": 63810 + }, + { + "epoch": 0.5851288163564683, + "learning_rate": 8.297607041349592e-05, + "loss": 0.7112, + "mean_token_accuracy": 0.784506893157959, + "num_tokens": 148454712.0, + "step": 63820 + }, + { + "epoch": 0.5852205005959475, + "learning_rate": 8.295773356560008e-05, + "loss": 0.6677, + "mean_token_accuracy": 0.7959107160568237, + "num_tokens": 148480565.0, + "step": 63830 + }, + { + "epoch": 0.5853121848354268, + "learning_rate": 8.293939671770423e-05, + "loss": 0.6874, + "mean_token_accuracy": 0.7842214405536652, + "num_tokens": 148505519.0, + "step": 63840 + }, + { + "epoch": 0.585403869074906, + "learning_rate": 8.292105986980839e-05, + "loss": 0.6732, + "mean_token_accuracy": 0.7953565776348114, + "num_tokens": 148530671.0, + "step": 63850 + }, + { + "epoch": 0.5854955533143853, + "learning_rate": 8.290272302191254e-05, + "loss": 0.7078, + "mean_token_accuracy": 0.7895129323005676, + "num_tokens": 148555245.0, + "step": 63860 + }, + { + "epoch": 0.5855872375538644, + "learning_rate": 8.288438617401669e-05, + "loss": 0.6757, + "mean_token_accuracy": 0.789818549156189, + "num_tokens": 148580095.0, + "step": 63870 + }, + { + "epoch": 0.5856789217933437, + "learning_rate": 8.286604932612084e-05, + "loss": 0.7043, + "mean_token_accuracy": 0.7819573879241943, + "num_tokens": 148605190.0, + "step": 63880 + }, + { + "epoch": 0.5857706060328229, + "learning_rate": 8.284771247822499e-05, + "loss": 0.7285, + "mean_token_accuracy": 0.7796127200126648, + "num_tokens": 148629971.0, + "step": 63890 + }, + { + "epoch": 0.5858622902723022, + "learning_rate": 8.282937563032916e-05, + "loss": 0.703, + "mean_token_accuracy": 0.7765686392784119, + "num_tokens": 148654816.0, + "step": 63900 + }, + { + "epoch": 0.5859539745117814, + "learning_rate": 8.281103878243331e-05, + "loss": 0.706, + "mean_token_accuracy": 0.7846543312072753, + "num_tokens": 148679096.0, + "step": 63910 + }, + { + "epoch": 0.5860456587512607, + "learning_rate": 8.279270193453745e-05, + "loss": 0.7324, + "mean_token_accuracy": 0.7754747748374939, + "num_tokens": 148704015.0, + "step": 63920 + }, + { + "epoch": 0.5861373429907399, + "learning_rate": 8.277436508664161e-05, + "loss": 0.6661, + "mean_token_accuracy": 0.7943182706832885, + "num_tokens": 148728561.0, + "step": 63930 + }, + { + "epoch": 0.5862290272302191, + "learning_rate": 8.275602823874577e-05, + "loss": 0.6813, + "mean_token_accuracy": 0.7870662689208985, + "num_tokens": 148753393.0, + "step": 63940 + }, + { + "epoch": 0.5863207114696983, + "learning_rate": 8.273769139084992e-05, + "loss": 0.6776, + "mean_token_accuracy": 0.7936405122280121, + "num_tokens": 148778269.0, + "step": 63950 + }, + { + "epoch": 0.5864123957091776, + "learning_rate": 8.271935454295407e-05, + "loss": 0.687, + "mean_token_accuracy": 0.7924061715602875, + "num_tokens": 148803149.0, + "step": 63960 + }, + { + "epoch": 0.5865040799486568, + "learning_rate": 8.270101769505822e-05, + "loss": 0.7006, + "mean_token_accuracy": 0.7836643159389496, + "num_tokens": 148828126.0, + "step": 63970 + }, + { + "epoch": 0.5865957641881361, + "learning_rate": 8.268268084716237e-05, + "loss": 0.6778, + "mean_token_accuracy": 0.7899862587451935, + "num_tokens": 148852811.0, + "step": 63980 + }, + { + "epoch": 0.5866874484276153, + "learning_rate": 8.266434399926652e-05, + "loss": 0.6866, + "mean_token_accuracy": 0.7958472669124603, + "num_tokens": 148877989.0, + "step": 63990 + }, + { + "epoch": 0.5867791326670945, + "learning_rate": 8.264600715137069e-05, + "loss": 0.7003, + "mean_token_accuracy": 0.7905132412910462, + "num_tokens": 148903389.0, + "step": 64000 + }, + { + "epoch": 0.5868708169065737, + "learning_rate": 8.262767030347484e-05, + "loss": 0.7212, + "mean_token_accuracy": 0.7804872572422028, + "num_tokens": 148928501.0, + "step": 64010 + }, + { + "epoch": 0.586962501146053, + "learning_rate": 8.260933345557898e-05, + "loss": 0.7057, + "mean_token_accuracy": 0.7765512049198151, + "num_tokens": 148953804.0, + "step": 64020 + }, + { + "epoch": 0.5870541853855322, + "learning_rate": 8.259099660768315e-05, + "loss": 0.7128, + "mean_token_accuracy": 0.7861216723918915, + "num_tokens": 148979129.0, + "step": 64030 + }, + { + "epoch": 0.5871458696250115, + "learning_rate": 8.25726597597873e-05, + "loss": 0.7306, + "mean_token_accuracy": 0.775581157207489, + "num_tokens": 149003538.0, + "step": 64040 + }, + { + "epoch": 0.5872375538644907, + "learning_rate": 8.255432291189145e-05, + "loss": 0.6787, + "mean_token_accuracy": 0.7887977957725525, + "num_tokens": 149028401.0, + "step": 64050 + }, + { + "epoch": 0.58732923810397, + "learning_rate": 8.25359860639956e-05, + "loss": 0.6916, + "mean_token_accuracy": 0.7851101934909821, + "num_tokens": 149053731.0, + "step": 64060 + }, + { + "epoch": 0.5874209223434491, + "learning_rate": 8.251764921609975e-05, + "loss": 0.6748, + "mean_token_accuracy": 0.7852842628955841, + "num_tokens": 149079284.0, + "step": 64070 + }, + { + "epoch": 0.5875126065829284, + "learning_rate": 8.24993123682039e-05, + "loss": 0.676, + "mean_token_accuracy": 0.7941822052001953, + "num_tokens": 149104286.0, + "step": 64080 + }, + { + "epoch": 0.5876042908224076, + "learning_rate": 8.248097552030807e-05, + "loss": 0.7135, + "mean_token_accuracy": 0.7870282888412475, + "num_tokens": 149129240.0, + "step": 64090 + }, + { + "epoch": 0.5876959750618869, + "learning_rate": 8.246263867241222e-05, + "loss": 0.7072, + "mean_token_accuracy": 0.7809190571308136, + "num_tokens": 149154121.0, + "step": 64100 + }, + { + "epoch": 0.5877876593013661, + "learning_rate": 8.244430182451637e-05, + "loss": 0.703, + "mean_token_accuracy": 0.7839613497257233, + "num_tokens": 149179463.0, + "step": 64110 + }, + { + "epoch": 0.5878793435408454, + "learning_rate": 8.242596497662051e-05, + "loss": 0.7044, + "mean_token_accuracy": 0.7832949101924896, + "num_tokens": 149204670.0, + "step": 64120 + }, + { + "epoch": 0.5879710277803246, + "learning_rate": 8.240762812872468e-05, + "loss": 0.6786, + "mean_token_accuracy": 0.7926870584487915, + "num_tokens": 149230302.0, + "step": 64130 + }, + { + "epoch": 0.5880627120198038, + "learning_rate": 8.238929128082883e-05, + "loss": 0.7348, + "mean_token_accuracy": 0.7770215153694153, + "num_tokens": 149255432.0, + "step": 64140 + }, + { + "epoch": 0.588154396259283, + "learning_rate": 8.237095443293298e-05, + "loss": 0.7225, + "mean_token_accuracy": 0.7816013813018798, + "num_tokens": 149280035.0, + "step": 64150 + }, + { + "epoch": 0.5882460804987623, + "learning_rate": 8.235261758503713e-05, + "loss": 0.6891, + "mean_token_accuracy": 0.784260493516922, + "num_tokens": 149305482.0, + "step": 64160 + }, + { + "epoch": 0.5883377647382415, + "learning_rate": 8.233428073714129e-05, + "loss": 0.6798, + "mean_token_accuracy": 0.7883141458034515, + "num_tokens": 149330366.0, + "step": 64170 + }, + { + "epoch": 0.5884294489777208, + "learning_rate": 8.231594388924544e-05, + "loss": 0.752, + "mean_token_accuracy": 0.7755284488201142, + "num_tokens": 149356050.0, + "step": 64180 + }, + { + "epoch": 0.5885211332172, + "learning_rate": 8.22976070413496e-05, + "loss": 0.6753, + "mean_token_accuracy": 0.7889199912548065, + "num_tokens": 149380828.0, + "step": 64190 + }, + { + "epoch": 0.5886128174566791, + "learning_rate": 8.227927019345375e-05, + "loss": 0.6886, + "mean_token_accuracy": 0.7897959649562836, + "num_tokens": 149406675.0, + "step": 64200 + }, + { + "epoch": 0.5887045016961584, + "learning_rate": 8.22609333455579e-05, + "loss": 0.7024, + "mean_token_accuracy": 0.7864479064941406, + "num_tokens": 149431617.0, + "step": 64210 + }, + { + "epoch": 0.5887961859356377, + "learning_rate": 8.224259649766206e-05, + "loss": 0.6716, + "mean_token_accuracy": 0.7913666784763336, + "num_tokens": 149457665.0, + "step": 64220 + }, + { + "epoch": 0.5888878701751169, + "learning_rate": 8.222425964976621e-05, + "loss": 0.7335, + "mean_token_accuracy": 0.7786946952342987, + "num_tokens": 149482827.0, + "step": 64230 + }, + { + "epoch": 0.5889795544145962, + "learning_rate": 8.220592280187036e-05, + "loss": 0.7222, + "mean_token_accuracy": 0.7779923200607299, + "num_tokens": 149507331.0, + "step": 64240 + }, + { + "epoch": 0.5890712386540754, + "learning_rate": 8.218758595397451e-05, + "loss": 0.7003, + "mean_token_accuracy": 0.7880372524261474, + "num_tokens": 149532621.0, + "step": 64250 + }, + { + "epoch": 0.5891629228935547, + "learning_rate": 8.216924910607867e-05, + "loss": 0.7143, + "mean_token_accuracy": 0.7853023648262024, + "num_tokens": 149557682.0, + "step": 64260 + }, + { + "epoch": 0.5892546071330338, + "learning_rate": 8.215091225818282e-05, + "loss": 0.7574, + "mean_token_accuracy": 0.7721137225627899, + "num_tokens": 149583441.0, + "step": 64270 + }, + { + "epoch": 0.589346291372513, + "learning_rate": 8.213257541028697e-05, + "loss": 0.7037, + "mean_token_accuracy": 0.7882411360740662, + "num_tokens": 149608127.0, + "step": 64280 + }, + { + "epoch": 0.5894379756119923, + "learning_rate": 8.211423856239113e-05, + "loss": 0.7061, + "mean_token_accuracy": 0.7803534269332886, + "num_tokens": 149632863.0, + "step": 64290 + }, + { + "epoch": 0.5895296598514715, + "learning_rate": 8.209590171449529e-05, + "loss": 0.7187, + "mean_token_accuracy": 0.7781393647193908, + "num_tokens": 149658488.0, + "step": 64300 + }, + { + "epoch": 0.5896213440909508, + "learning_rate": 8.207756486659944e-05, + "loss": 0.6871, + "mean_token_accuracy": 0.7872996270656586, + "num_tokens": 149683311.0, + "step": 64310 + }, + { + "epoch": 0.58971302833043, + "learning_rate": 8.205922801870359e-05, + "loss": 0.6876, + "mean_token_accuracy": 0.7906221568584442, + "num_tokens": 149709057.0, + "step": 64320 + }, + { + "epoch": 0.5898047125699092, + "learning_rate": 8.204089117080774e-05, + "loss": 0.7203, + "mean_token_accuracy": 0.7827765464782714, + "num_tokens": 149733195.0, + "step": 64330 + }, + { + "epoch": 0.5898963968093884, + "learning_rate": 8.20225543229119e-05, + "loss": 0.694, + "mean_token_accuracy": 0.7838902354240418, + "num_tokens": 149757775.0, + "step": 64340 + }, + { + "epoch": 0.5899880810488677, + "learning_rate": 8.200421747501606e-05, + "loss": 0.7291, + "mean_token_accuracy": 0.7774064660072326, + "num_tokens": 149782232.0, + "step": 64350 + }, + { + "epoch": 0.5900797652883469, + "learning_rate": 8.19858806271202e-05, + "loss": 0.6934, + "mean_token_accuracy": 0.7859097242355346, + "num_tokens": 149807883.0, + "step": 64360 + }, + { + "epoch": 0.5901714495278262, + "learning_rate": 8.196754377922435e-05, + "loss": 0.7679, + "mean_token_accuracy": 0.7702005982398987, + "num_tokens": 149833750.0, + "step": 64370 + }, + { + "epoch": 0.5902631337673054, + "learning_rate": 8.19492069313285e-05, + "loss": 0.6779, + "mean_token_accuracy": 0.7937423825263977, + "num_tokens": 149858563.0, + "step": 64380 + }, + { + "epoch": 0.5903548180067847, + "learning_rate": 8.193087008343267e-05, + "loss": 0.7196, + "mean_token_accuracy": 0.7906647562980652, + "num_tokens": 149883174.0, + "step": 64390 + }, + { + "epoch": 0.5904465022462638, + "learning_rate": 8.191253323553682e-05, + "loss": 0.7145, + "mean_token_accuracy": 0.7835176408290863, + "num_tokens": 149907710.0, + "step": 64400 + }, + { + "epoch": 0.5905381864857431, + "learning_rate": 8.189419638764097e-05, + "loss": 0.6796, + "mean_token_accuracy": 0.7890723168849945, + "num_tokens": 149932311.0, + "step": 64410 + }, + { + "epoch": 0.5906298707252223, + "learning_rate": 8.187585953974512e-05, + "loss": 0.676, + "mean_token_accuracy": 0.7912966549396515, + "num_tokens": 149956459.0, + "step": 64420 + }, + { + "epoch": 0.5907215549647016, + "learning_rate": 8.185752269184927e-05, + "loss": 0.6672, + "mean_token_accuracy": 0.7880989968776703, + "num_tokens": 149981931.0, + "step": 64430 + }, + { + "epoch": 0.5908132392041808, + "learning_rate": 8.183918584395343e-05, + "loss": 0.704, + "mean_token_accuracy": 0.7908606708049775, + "num_tokens": 150007268.0, + "step": 64440 + }, + { + "epoch": 0.5909049234436601, + "learning_rate": 8.182084899605759e-05, + "loss": 0.6759, + "mean_token_accuracy": 0.7926512897014618, + "num_tokens": 150032489.0, + "step": 64450 + }, + { + "epoch": 0.5909966076831392, + "learning_rate": 8.180251214816173e-05, + "loss": 0.7026, + "mean_token_accuracy": 0.7807465970516205, + "num_tokens": 150057536.0, + "step": 64460 + }, + { + "epoch": 0.5910882919226185, + "learning_rate": 8.178417530026588e-05, + "loss": 0.7167, + "mean_token_accuracy": 0.7739458680152893, + "num_tokens": 150083170.0, + "step": 64470 + }, + { + "epoch": 0.5911799761620977, + "learning_rate": 8.176583845237003e-05, + "loss": 0.6609, + "mean_token_accuracy": 0.7943176209926606, + "num_tokens": 150108355.0, + "step": 64480 + }, + { + "epoch": 0.591271660401577, + "learning_rate": 8.17475016044742e-05, + "loss": 0.7059, + "mean_token_accuracy": 0.7872118592262268, + "num_tokens": 150133293.0, + "step": 64490 + }, + { + "epoch": 0.5913633446410562, + "learning_rate": 8.172916475657835e-05, + "loss": 0.7191, + "mean_token_accuracy": 0.7783481657505036, + "num_tokens": 150158436.0, + "step": 64500 + }, + { + "epoch": 0.5914550288805355, + "learning_rate": 8.17108279086825e-05, + "loss": 0.7325, + "mean_token_accuracy": 0.7804322838783264, + "num_tokens": 150183183.0, + "step": 64510 + }, + { + "epoch": 0.5915467131200147, + "learning_rate": 8.169249106078666e-05, + "loss": 0.6876, + "mean_token_accuracy": 0.7907378137111664, + "num_tokens": 150208272.0, + "step": 64520 + }, + { + "epoch": 0.5916383973594939, + "learning_rate": 8.167415421289081e-05, + "loss": 0.7189, + "mean_token_accuracy": 0.7767588555812835, + "num_tokens": 150232546.0, + "step": 64530 + }, + { + "epoch": 0.5917300815989731, + "learning_rate": 8.165581736499496e-05, + "loss": 0.7075, + "mean_token_accuracy": 0.7842768251895904, + "num_tokens": 150257428.0, + "step": 64540 + }, + { + "epoch": 0.5918217658384524, + "learning_rate": 8.163748051709912e-05, + "loss": 0.6866, + "mean_token_accuracy": 0.7891097903251648, + "num_tokens": 150282125.0, + "step": 64550 + }, + { + "epoch": 0.5919134500779316, + "learning_rate": 8.161914366920326e-05, + "loss": 0.7235, + "mean_token_accuracy": 0.7783652007579803, + "num_tokens": 150307180.0, + "step": 64560 + }, + { + "epoch": 0.5920051343174109, + "learning_rate": 8.160080682130741e-05, + "loss": 0.6768, + "mean_token_accuracy": 0.7973542153835297, + "num_tokens": 150332280.0, + "step": 64570 + }, + { + "epoch": 0.5920968185568901, + "learning_rate": 8.158246997341158e-05, + "loss": 0.7015, + "mean_token_accuracy": 0.7862518548965454, + "num_tokens": 150357272.0, + "step": 64580 + }, + { + "epoch": 0.5921885027963693, + "learning_rate": 8.156413312551573e-05, + "loss": 0.7327, + "mean_token_accuracy": 0.7767649173736573, + "num_tokens": 150382115.0, + "step": 64590 + }, + { + "epoch": 0.5922801870358485, + "learning_rate": 8.154579627761988e-05, + "loss": 0.7009, + "mean_token_accuracy": 0.788267582654953, + "num_tokens": 150405832.0, + "step": 64600 + }, + { + "epoch": 0.5923718712753278, + "learning_rate": 8.152745942972404e-05, + "loss": 0.6938, + "mean_token_accuracy": 0.7892520785331726, + "num_tokens": 150430587.0, + "step": 64610 + }, + { + "epoch": 0.592463555514807, + "learning_rate": 8.150912258182819e-05, + "loss": 0.7184, + "mean_token_accuracy": 0.7759264647960663, + "num_tokens": 150455270.0, + "step": 64620 + }, + { + "epoch": 0.5925552397542863, + "learning_rate": 8.149078573393234e-05, + "loss": 0.6988, + "mean_token_accuracy": 0.7858653008937836, + "num_tokens": 150480147.0, + "step": 64630 + }, + { + "epoch": 0.5926469239937655, + "learning_rate": 8.147244888603649e-05, + "loss": 0.721, + "mean_token_accuracy": 0.7873132884502411, + "num_tokens": 150504742.0, + "step": 64640 + }, + { + "epoch": 0.5927386082332448, + "learning_rate": 8.145411203814066e-05, + "loss": 0.7336, + "mean_token_accuracy": 0.7803522884845734, + "num_tokens": 150529394.0, + "step": 64650 + }, + { + "epoch": 0.5928302924727239, + "learning_rate": 8.14357751902448e-05, + "loss": 0.699, + "mean_token_accuracy": 0.7888843536376953, + "num_tokens": 150554556.0, + "step": 64660 + }, + { + "epoch": 0.5929219767122031, + "learning_rate": 8.141743834234895e-05, + "loss": 0.6712, + "mean_token_accuracy": 0.7859473407268525, + "num_tokens": 150579300.0, + "step": 64670 + }, + { + "epoch": 0.5930136609516824, + "learning_rate": 8.139910149445311e-05, + "loss": 0.6879, + "mean_token_accuracy": 0.7903903961181641, + "num_tokens": 150605010.0, + "step": 64680 + }, + { + "epoch": 0.5931053451911616, + "learning_rate": 8.138076464655726e-05, + "loss": 0.6907, + "mean_token_accuracy": 0.7918246030807495, + "num_tokens": 150630010.0, + "step": 64690 + }, + { + "epoch": 0.5931970294306409, + "learning_rate": 8.136242779866142e-05, + "loss": 0.6718, + "mean_token_accuracy": 0.7947119235992431, + "num_tokens": 150654790.0, + "step": 64700 + }, + { + "epoch": 0.5932887136701201, + "learning_rate": 8.134409095076557e-05, + "loss": 0.7054, + "mean_token_accuracy": 0.7794699013233185, + "num_tokens": 150680688.0, + "step": 64710 + }, + { + "epoch": 0.5933803979095993, + "learning_rate": 8.132575410286972e-05, + "loss": 0.6995, + "mean_token_accuracy": 0.7933349549770355, + "num_tokens": 150705217.0, + "step": 64720 + }, + { + "epoch": 0.5934720821490785, + "learning_rate": 8.130741725497387e-05, + "loss": 0.7355, + "mean_token_accuracy": 0.7805914580821991, + "num_tokens": 150731051.0, + "step": 64730 + }, + { + "epoch": 0.5935637663885578, + "learning_rate": 8.128908040707802e-05, + "loss": 0.6802, + "mean_token_accuracy": 0.7900279283523559, + "num_tokens": 150755700.0, + "step": 64740 + }, + { + "epoch": 0.593655450628037, + "learning_rate": 8.127074355918219e-05, + "loss": 0.6721, + "mean_token_accuracy": 0.7904886305332184, + "num_tokens": 150780723.0, + "step": 64750 + }, + { + "epoch": 0.5937471348675163, + "learning_rate": 8.125240671128633e-05, + "loss": 0.7406, + "mean_token_accuracy": 0.7759748756885528, + "num_tokens": 150806416.0, + "step": 64760 + }, + { + "epoch": 0.5938388191069955, + "learning_rate": 8.123406986339048e-05, + "loss": 0.7001, + "mean_token_accuracy": 0.7837151050567627, + "num_tokens": 150832653.0, + "step": 64770 + }, + { + "epoch": 0.5939305033464748, + "learning_rate": 8.121573301549464e-05, + "loss": 0.7388, + "mean_token_accuracy": 0.7705853223800659, + "num_tokens": 150857682.0, + "step": 64780 + }, + { + "epoch": 0.5940221875859539, + "learning_rate": 8.11973961675988e-05, + "loss": 0.6735, + "mean_token_accuracy": 0.7909241139888763, + "num_tokens": 150883588.0, + "step": 64790 + }, + { + "epoch": 0.5941138718254332, + "learning_rate": 8.117905931970295e-05, + "loss": 0.712, + "mean_token_accuracy": 0.7861241042613983, + "num_tokens": 150908475.0, + "step": 64800 + }, + { + "epoch": 0.5942055560649124, + "learning_rate": 8.11607224718071e-05, + "loss": 0.6678, + "mean_token_accuracy": 0.7927547752857208, + "num_tokens": 150933485.0, + "step": 64810 + }, + { + "epoch": 0.5942972403043917, + "learning_rate": 8.114238562391125e-05, + "loss": 0.7102, + "mean_token_accuracy": 0.7864205956459045, + "num_tokens": 150958465.0, + "step": 64820 + }, + { + "epoch": 0.5943889245438709, + "learning_rate": 8.11240487760154e-05, + "loss": 0.677, + "mean_token_accuracy": 0.7920351564884186, + "num_tokens": 150983351.0, + "step": 64830 + }, + { + "epoch": 0.5944806087833502, + "learning_rate": 8.110571192811957e-05, + "loss": 0.6978, + "mean_token_accuracy": 0.7859266996383667, + "num_tokens": 151008309.0, + "step": 64840 + }, + { + "epoch": 0.5945722930228293, + "learning_rate": 8.108737508022372e-05, + "loss": 0.6822, + "mean_token_accuracy": 0.7874178767204285, + "num_tokens": 151032966.0, + "step": 64850 + }, + { + "epoch": 0.5946639772623086, + "learning_rate": 8.106903823232786e-05, + "loss": 0.6714, + "mean_token_accuracy": 0.7888278841972352, + "num_tokens": 151057177.0, + "step": 64860 + }, + { + "epoch": 0.5947556615017878, + "learning_rate": 8.105070138443201e-05, + "loss": 0.712, + "mean_token_accuracy": 0.7801290571689605, + "num_tokens": 151082202.0, + "step": 64870 + }, + { + "epoch": 0.5948473457412671, + "learning_rate": 8.103236453653618e-05, + "loss": 0.7165, + "mean_token_accuracy": 0.7849847555160523, + "num_tokens": 151107226.0, + "step": 64880 + }, + { + "epoch": 0.5949390299807463, + "learning_rate": 8.101402768864033e-05, + "loss": 0.7182, + "mean_token_accuracy": 0.7808296024799347, + "num_tokens": 151132624.0, + "step": 64890 + }, + { + "epoch": 0.5950307142202256, + "learning_rate": 8.099569084074448e-05, + "loss": 0.6896, + "mean_token_accuracy": 0.7926852285861969, + "num_tokens": 151158280.0, + "step": 64900 + }, + { + "epoch": 0.5951223984597048, + "learning_rate": 8.097735399284863e-05, + "loss": 0.6973, + "mean_token_accuracy": 0.7888705492019653, + "num_tokens": 151183554.0, + "step": 64910 + }, + { + "epoch": 0.595214082699184, + "learning_rate": 8.095901714495278e-05, + "loss": 0.6543, + "mean_token_accuracy": 0.7970582187175751, + "num_tokens": 151208225.0, + "step": 64920 + }, + { + "epoch": 0.5953057669386632, + "learning_rate": 8.094068029705694e-05, + "loss": 0.6996, + "mean_token_accuracy": 0.7853852927684783, + "num_tokens": 151233791.0, + "step": 64930 + }, + { + "epoch": 0.5953974511781425, + "learning_rate": 8.09223434491611e-05, + "loss": 0.6992, + "mean_token_accuracy": 0.7901147663593292, + "num_tokens": 151258661.0, + "step": 64940 + }, + { + "epoch": 0.5954891354176217, + "learning_rate": 8.090400660126525e-05, + "loss": 0.6817, + "mean_token_accuracy": 0.7880674540996552, + "num_tokens": 151283145.0, + "step": 64950 + }, + { + "epoch": 0.595580819657101, + "learning_rate": 8.088566975336939e-05, + "loss": 0.6976, + "mean_token_accuracy": 0.7901171863079071, + "num_tokens": 151307149.0, + "step": 64960 + }, + { + "epoch": 0.5956725038965802, + "learning_rate": 8.086733290547356e-05, + "loss": 0.6381, + "mean_token_accuracy": 0.8069639921188354, + "num_tokens": 151332250.0, + "step": 64970 + }, + { + "epoch": 0.5957641881360594, + "learning_rate": 8.084899605757771e-05, + "loss": 0.6729, + "mean_token_accuracy": 0.7924875020980835, + "num_tokens": 151356917.0, + "step": 64980 + }, + { + "epoch": 0.5958558723755386, + "learning_rate": 8.083065920968186e-05, + "loss": 0.6723, + "mean_token_accuracy": 0.7953984498977661, + "num_tokens": 151381471.0, + "step": 64990 + }, + { + "epoch": 0.5959475566150179, + "learning_rate": 8.081232236178601e-05, + "loss": 0.721, + "mean_token_accuracy": 0.779432862997055, + "num_tokens": 151405820.0, + "step": 65000 + }, + { + "epoch": 0.5960392408544971, + "learning_rate": 8.079398551389016e-05, + "loss": 0.704, + "mean_token_accuracy": 0.7881818771362304, + "num_tokens": 151431025.0, + "step": 65010 + }, + { + "epoch": 0.5961309250939764, + "learning_rate": 8.077564866599432e-05, + "loss": 0.6858, + "mean_token_accuracy": 0.7907904803752899, + "num_tokens": 151455337.0, + "step": 65020 + }, + { + "epoch": 0.5962226093334556, + "learning_rate": 8.075731181809847e-05, + "loss": 0.674, + "mean_token_accuracy": 0.7922715544700623, + "num_tokens": 151479919.0, + "step": 65030 + }, + { + "epoch": 0.5963142935729349, + "learning_rate": 8.073897497020263e-05, + "loss": 0.689, + "mean_token_accuracy": 0.7919419050216675, + "num_tokens": 151505252.0, + "step": 65040 + }, + { + "epoch": 0.596405977812414, + "learning_rate": 8.072063812230679e-05, + "loss": 0.6699, + "mean_token_accuracy": 0.7882711529731751, + "num_tokens": 151530038.0, + "step": 65050 + }, + { + "epoch": 0.5964976620518933, + "learning_rate": 8.070230127441092e-05, + "loss": 0.7049, + "mean_token_accuracy": 0.7847719013690948, + "num_tokens": 151555326.0, + "step": 65060 + }, + { + "epoch": 0.5965893462913725, + "learning_rate": 8.068396442651509e-05, + "loss": 0.7061, + "mean_token_accuracy": 0.7804329514503479, + "num_tokens": 151580855.0, + "step": 65070 + }, + { + "epoch": 0.5966810305308518, + "learning_rate": 8.066562757861924e-05, + "loss": 0.7034, + "mean_token_accuracy": 0.7878237545490265, + "num_tokens": 151605551.0, + "step": 65080 + }, + { + "epoch": 0.596772714770331, + "learning_rate": 8.064729073072339e-05, + "loss": 0.706, + "mean_token_accuracy": 0.7816583752632141, + "num_tokens": 151629801.0, + "step": 65090 + }, + { + "epoch": 0.5968643990098103, + "learning_rate": 8.062895388282754e-05, + "loss": 0.6935, + "mean_token_accuracy": 0.7866775929927826, + "num_tokens": 151655179.0, + "step": 65100 + }, + { + "epoch": 0.5969560832492894, + "learning_rate": 8.06106170349317e-05, + "loss": 0.6813, + "mean_token_accuracy": 0.79028679728508, + "num_tokens": 151680104.0, + "step": 65110 + }, + { + "epoch": 0.5970477674887686, + "learning_rate": 8.059228018703585e-05, + "loss": 0.6809, + "mean_token_accuracy": 0.7855668783187866, + "num_tokens": 151705046.0, + "step": 65120 + }, + { + "epoch": 0.5971394517282479, + "learning_rate": 8.057394333914e-05, + "loss": 0.7323, + "mean_token_accuracy": 0.7846117556095124, + "num_tokens": 151729319.0, + "step": 65130 + }, + { + "epoch": 0.5972311359677271, + "learning_rate": 8.055560649124417e-05, + "loss": 0.7051, + "mean_token_accuracy": 0.7806686639785767, + "num_tokens": 151754957.0, + "step": 65140 + }, + { + "epoch": 0.5973228202072064, + "learning_rate": 8.053726964334832e-05, + "loss": 0.6877, + "mean_token_accuracy": 0.7896865606307983, + "num_tokens": 151779890.0, + "step": 65150 + }, + { + "epoch": 0.5974145044466856, + "learning_rate": 8.051893279545246e-05, + "loss": 0.6815, + "mean_token_accuracy": 0.7892807781696319, + "num_tokens": 151804724.0, + "step": 65160 + }, + { + "epoch": 0.5975061886861649, + "learning_rate": 8.050059594755662e-05, + "loss": 0.728, + "mean_token_accuracy": 0.7809356033802033, + "num_tokens": 151830000.0, + "step": 65170 + }, + { + "epoch": 0.597597872925644, + "learning_rate": 8.048225909966077e-05, + "loss": 0.6906, + "mean_token_accuracy": 0.7841889500617981, + "num_tokens": 151855194.0, + "step": 65180 + }, + { + "epoch": 0.5976895571651233, + "learning_rate": 8.046392225176492e-05, + "loss": 0.6852, + "mean_token_accuracy": 0.7840856671333313, + "num_tokens": 151879696.0, + "step": 65190 + }, + { + "epoch": 0.5977812414046025, + "learning_rate": 8.044558540386909e-05, + "loss": 0.6867, + "mean_token_accuracy": 0.7938149988651275, + "num_tokens": 151904775.0, + "step": 65200 + }, + { + "epoch": 0.5978729256440818, + "learning_rate": 8.042724855597323e-05, + "loss": 0.683, + "mean_token_accuracy": 0.7929098248481751, + "num_tokens": 151930309.0, + "step": 65210 + }, + { + "epoch": 0.597964609883561, + "learning_rate": 8.040891170807738e-05, + "loss": 0.6739, + "mean_token_accuracy": 0.785862410068512, + "num_tokens": 151955790.0, + "step": 65220 + }, + { + "epoch": 0.5980562941230403, + "learning_rate": 8.039057486018153e-05, + "loss": 0.676, + "mean_token_accuracy": 0.7941699206829071, + "num_tokens": 151981094.0, + "step": 65230 + }, + { + "epoch": 0.5981479783625194, + "learning_rate": 8.03722380122857e-05, + "loss": 0.6917, + "mean_token_accuracy": 0.793646776676178, + "num_tokens": 152005920.0, + "step": 65240 + }, + { + "epoch": 0.5982396626019987, + "learning_rate": 8.035390116438985e-05, + "loss": 0.6736, + "mean_token_accuracy": 0.7904787123203277, + "num_tokens": 152031097.0, + "step": 65250 + }, + { + "epoch": 0.5983313468414779, + "learning_rate": 8.033556431649399e-05, + "loss": 0.7083, + "mean_token_accuracy": 0.7841505885124207, + "num_tokens": 152055763.0, + "step": 65260 + }, + { + "epoch": 0.5984230310809572, + "learning_rate": 8.031722746859815e-05, + "loss": 0.6915, + "mean_token_accuracy": 0.7877865970134735, + "num_tokens": 152079670.0, + "step": 65270 + }, + { + "epoch": 0.5985147153204364, + "learning_rate": 8.02988906207023e-05, + "loss": 0.7102, + "mean_token_accuracy": 0.7813880145549774, + "num_tokens": 152104967.0, + "step": 65280 + }, + { + "epoch": 0.5986063995599157, + "learning_rate": 8.028055377280646e-05, + "loss": 0.6715, + "mean_token_accuracy": 0.7874277710914612, + "num_tokens": 152129490.0, + "step": 65290 + }, + { + "epoch": 0.5986980837993949, + "learning_rate": 8.026221692491062e-05, + "loss": 0.6921, + "mean_token_accuracy": 0.786574387550354, + "num_tokens": 152155020.0, + "step": 65300 + }, + { + "epoch": 0.5987897680388741, + "learning_rate": 8.024388007701476e-05, + "loss": 0.7322, + "mean_token_accuracy": 0.7764752984046936, + "num_tokens": 152180178.0, + "step": 65310 + }, + { + "epoch": 0.5988814522783533, + "learning_rate": 8.022554322911891e-05, + "loss": 0.6781, + "mean_token_accuracy": 0.787101149559021, + "num_tokens": 152204476.0, + "step": 65320 + }, + { + "epoch": 0.5989731365178326, + "learning_rate": 8.020720638122308e-05, + "loss": 0.7171, + "mean_token_accuracy": 0.7777836680412292, + "num_tokens": 152230885.0, + "step": 65330 + }, + { + "epoch": 0.5990648207573118, + "learning_rate": 8.018886953332723e-05, + "loss": 0.6962, + "mean_token_accuracy": 0.7864459693431854, + "num_tokens": 152256924.0, + "step": 65340 + }, + { + "epoch": 0.5991565049967911, + "learning_rate": 8.017053268543138e-05, + "loss": 0.6956, + "mean_token_accuracy": 0.7886278092861175, + "num_tokens": 152281849.0, + "step": 65350 + }, + { + "epoch": 0.5992481892362703, + "learning_rate": 8.015219583753552e-05, + "loss": 0.6831, + "mean_token_accuracy": 0.7853272080421447, + "num_tokens": 152306272.0, + "step": 65360 + }, + { + "epoch": 0.5993398734757496, + "learning_rate": 8.013385898963969e-05, + "loss": 0.7205, + "mean_token_accuracy": 0.7834070980548858, + "num_tokens": 152331405.0, + "step": 65370 + }, + { + "epoch": 0.5994315577152287, + "learning_rate": 8.011552214174384e-05, + "loss": 0.7185, + "mean_token_accuracy": 0.7829317331314087, + "num_tokens": 152356810.0, + "step": 65380 + }, + { + "epoch": 0.599523241954708, + "learning_rate": 8.009718529384799e-05, + "loss": 0.7058, + "mean_token_accuracy": 0.7811625599861145, + "num_tokens": 152381447.0, + "step": 65390 + }, + { + "epoch": 0.5996149261941872, + "learning_rate": 8.007884844595215e-05, + "loss": 0.6892, + "mean_token_accuracy": 0.7936155915260314, + "num_tokens": 152406264.0, + "step": 65400 + }, + { + "epoch": 0.5997066104336665, + "learning_rate": 8.006051159805629e-05, + "loss": 0.6826, + "mean_token_accuracy": 0.7890279054641723, + "num_tokens": 152431032.0, + "step": 65410 + }, + { + "epoch": 0.5997982946731457, + "learning_rate": 8.004217475016045e-05, + "loss": 0.6958, + "mean_token_accuracy": 0.7899737179279327, + "num_tokens": 152456170.0, + "step": 65420 + }, + { + "epoch": 0.599889978912625, + "learning_rate": 8.002383790226461e-05, + "loss": 0.741, + "mean_token_accuracy": 0.7748258411884308, + "num_tokens": 152480781.0, + "step": 65430 + }, + { + "epoch": 0.5999816631521041, + "learning_rate": 8.000550105436876e-05, + "loss": 0.6455, + "mean_token_accuracy": 0.7952584981918335, + "num_tokens": 152505840.0, + "step": 65440 + }, + { + "epoch": 0.6000733473915834, + "learning_rate": 7.998716420647291e-05, + "loss": 0.7077, + "mean_token_accuracy": 0.7831570863723755, + "num_tokens": 152531592.0, + "step": 65450 + }, + { + "epoch": 0.6001650316310626, + "learning_rate": 7.996882735857707e-05, + "loss": 0.7068, + "mean_token_accuracy": 0.7849279761314392, + "num_tokens": 152556504.0, + "step": 65460 + }, + { + "epoch": 0.6002567158705419, + "learning_rate": 7.995049051068122e-05, + "loss": 0.7487, + "mean_token_accuracy": 0.7772552847862244, + "num_tokens": 152581558.0, + "step": 65470 + }, + { + "epoch": 0.6003484001100211, + "learning_rate": 7.993215366278537e-05, + "loss": 0.6702, + "mean_token_accuracy": 0.791909259557724, + "num_tokens": 152605845.0, + "step": 65480 + }, + { + "epoch": 0.6004400843495004, + "learning_rate": 7.991381681488952e-05, + "loss": 0.687, + "mean_token_accuracy": 0.7882726311683654, + "num_tokens": 152630447.0, + "step": 65490 + }, + { + "epoch": 0.6005317685889796, + "learning_rate": 7.989547996699369e-05, + "loss": 0.6964, + "mean_token_accuracy": 0.7861719489097595, + "num_tokens": 152656099.0, + "step": 65500 + }, + { + "epoch": 0.6006234528284587, + "learning_rate": 7.987714311909783e-05, + "loss": 0.6742, + "mean_token_accuracy": 0.7913962602615356, + "num_tokens": 152681331.0, + "step": 65510 + }, + { + "epoch": 0.600715137067938, + "learning_rate": 7.985880627120198e-05, + "loss": 0.7271, + "mean_token_accuracy": 0.776265412569046, + "num_tokens": 152706181.0, + "step": 65520 + }, + { + "epoch": 0.6008068213074172, + "learning_rate": 7.984046942330614e-05, + "loss": 0.6754, + "mean_token_accuracy": 0.7891752243041992, + "num_tokens": 152731027.0, + "step": 65530 + }, + { + "epoch": 0.6008985055468965, + "learning_rate": 7.98221325754103e-05, + "loss": 0.733, + "mean_token_accuracy": 0.7765580773353576, + "num_tokens": 152756104.0, + "step": 65540 + }, + { + "epoch": 0.6009901897863758, + "learning_rate": 7.980379572751445e-05, + "loss": 0.6609, + "mean_token_accuracy": 0.794046550989151, + "num_tokens": 152781495.0, + "step": 65550 + }, + { + "epoch": 0.601081874025855, + "learning_rate": 7.97854588796186e-05, + "loss": 0.679, + "mean_token_accuracy": 0.789538037776947, + "num_tokens": 152806749.0, + "step": 65560 + }, + { + "epoch": 0.6011735582653341, + "learning_rate": 7.976712203172275e-05, + "loss": 0.6738, + "mean_token_accuracy": 0.7955724179744721, + "num_tokens": 152832054.0, + "step": 65570 + }, + { + "epoch": 0.6012652425048134, + "learning_rate": 7.97487851838269e-05, + "loss": 0.7199, + "mean_token_accuracy": 0.7878151297569275, + "num_tokens": 152857367.0, + "step": 65580 + }, + { + "epoch": 0.6013569267442926, + "learning_rate": 7.973044833593107e-05, + "loss": 0.7094, + "mean_token_accuracy": 0.7771391034126282, + "num_tokens": 152881428.0, + "step": 65590 + }, + { + "epoch": 0.6014486109837719, + "learning_rate": 7.971211148803522e-05, + "loss": 0.6544, + "mean_token_accuracy": 0.7940707743167877, + "num_tokens": 152906365.0, + "step": 65600 + }, + { + "epoch": 0.6015402952232511, + "learning_rate": 7.969377464013936e-05, + "loss": 0.6791, + "mean_token_accuracy": 0.7848674297332764, + "num_tokens": 152932233.0, + "step": 65610 + }, + { + "epoch": 0.6016319794627304, + "learning_rate": 7.967543779224351e-05, + "loss": 0.6883, + "mean_token_accuracy": 0.7926348149776459, + "num_tokens": 152956550.0, + "step": 65620 + }, + { + "epoch": 0.6017236637022096, + "learning_rate": 7.965710094434767e-05, + "loss": 0.7123, + "mean_token_accuracy": 0.7827710986137391, + "num_tokens": 152982137.0, + "step": 65630 + }, + { + "epoch": 0.6018153479416888, + "learning_rate": 7.963876409645183e-05, + "loss": 0.7092, + "mean_token_accuracy": 0.782976770401001, + "num_tokens": 153008140.0, + "step": 65640 + }, + { + "epoch": 0.601907032181168, + "learning_rate": 7.962042724855598e-05, + "loss": 0.6876, + "mean_token_accuracy": 0.7896133840084076, + "num_tokens": 153033161.0, + "step": 65650 + }, + { + "epoch": 0.6019987164206473, + "learning_rate": 7.960209040066013e-05, + "loss": 0.701, + "mean_token_accuracy": 0.7877236247062683, + "num_tokens": 153058576.0, + "step": 65660 + }, + { + "epoch": 0.6020904006601265, + "learning_rate": 7.958375355276428e-05, + "loss": 0.7046, + "mean_token_accuracy": 0.7810765504837036, + "num_tokens": 153083607.0, + "step": 65670 + }, + { + "epoch": 0.6021820848996058, + "learning_rate": 7.956541670486843e-05, + "loss": 0.6827, + "mean_token_accuracy": 0.7892462730407714, + "num_tokens": 153109400.0, + "step": 65680 + }, + { + "epoch": 0.602273769139085, + "learning_rate": 7.95470798569726e-05, + "loss": 0.6888, + "mean_token_accuracy": 0.7928320884704589, + "num_tokens": 153134951.0, + "step": 65690 + }, + { + "epoch": 0.6023654533785642, + "learning_rate": 7.952874300907675e-05, + "loss": 0.6838, + "mean_token_accuracy": 0.7948405981063843, + "num_tokens": 153160933.0, + "step": 65700 + }, + { + "epoch": 0.6024571376180434, + "learning_rate": 7.951040616118089e-05, + "loss": 0.7027, + "mean_token_accuracy": 0.7873086512088776, + "num_tokens": 153186376.0, + "step": 65710 + }, + { + "epoch": 0.6025488218575227, + "learning_rate": 7.949206931328504e-05, + "loss": 0.6842, + "mean_token_accuracy": 0.790751975774765, + "num_tokens": 153212680.0, + "step": 65720 + }, + { + "epoch": 0.6026405060970019, + "learning_rate": 7.947373246538921e-05, + "loss": 0.6753, + "mean_token_accuracy": 0.7919830679893494, + "num_tokens": 153237542.0, + "step": 65730 + }, + { + "epoch": 0.6027321903364812, + "learning_rate": 7.945539561749336e-05, + "loss": 0.6947, + "mean_token_accuracy": 0.7838497817516327, + "num_tokens": 153262276.0, + "step": 65740 + }, + { + "epoch": 0.6028238745759604, + "learning_rate": 7.943705876959751e-05, + "loss": 0.6617, + "mean_token_accuracy": 0.791743528842926, + "num_tokens": 153287441.0, + "step": 65750 + }, + { + "epoch": 0.6029155588154397, + "learning_rate": 7.941872192170166e-05, + "loss": 0.7073, + "mean_token_accuracy": 0.7812867045402527, + "num_tokens": 153312416.0, + "step": 65760 + }, + { + "epoch": 0.6030072430549188, + "learning_rate": 7.940038507380581e-05, + "loss": 0.6934, + "mean_token_accuracy": 0.7891874372959137, + "num_tokens": 153338303.0, + "step": 65770 + }, + { + "epoch": 0.6030989272943981, + "learning_rate": 7.938204822590997e-05, + "loss": 0.6945, + "mean_token_accuracy": 0.7873879969120026, + "num_tokens": 153363072.0, + "step": 65780 + }, + { + "epoch": 0.6031906115338773, + "learning_rate": 7.936371137801413e-05, + "loss": 0.705, + "mean_token_accuracy": 0.7892035901546478, + "num_tokens": 153388420.0, + "step": 65790 + }, + { + "epoch": 0.6032822957733566, + "learning_rate": 7.934537453011828e-05, + "loss": 0.6981, + "mean_token_accuracy": 0.7878020882606507, + "num_tokens": 153413679.0, + "step": 65800 + }, + { + "epoch": 0.6033739800128358, + "learning_rate": 7.932703768222242e-05, + "loss": 0.7285, + "mean_token_accuracy": 0.7841762900352478, + "num_tokens": 153438648.0, + "step": 65810 + }, + { + "epoch": 0.6034656642523151, + "learning_rate": 7.930870083432659e-05, + "loss": 0.719, + "mean_token_accuracy": 0.779742956161499, + "num_tokens": 153462828.0, + "step": 65820 + }, + { + "epoch": 0.6035573484917942, + "learning_rate": 7.929036398643074e-05, + "loss": 0.6949, + "mean_token_accuracy": 0.7837848901748657, + "num_tokens": 153488382.0, + "step": 65830 + }, + { + "epoch": 0.6036490327312735, + "learning_rate": 7.927202713853489e-05, + "loss": 0.7072, + "mean_token_accuracy": 0.7886743426322937, + "num_tokens": 153512937.0, + "step": 65840 + }, + { + "epoch": 0.6037407169707527, + "learning_rate": 7.925369029063904e-05, + "loss": 0.6816, + "mean_token_accuracy": 0.7898770630359649, + "num_tokens": 153538815.0, + "step": 65850 + }, + { + "epoch": 0.603832401210232, + "learning_rate": 7.92353534427432e-05, + "loss": 0.7123, + "mean_token_accuracy": 0.7815713942050934, + "num_tokens": 153563671.0, + "step": 65860 + }, + { + "epoch": 0.6039240854497112, + "learning_rate": 7.921701659484735e-05, + "loss": 0.6893, + "mean_token_accuracy": 0.7910423338413238, + "num_tokens": 153588938.0, + "step": 65870 + }, + { + "epoch": 0.6040157696891905, + "learning_rate": 7.91986797469515e-05, + "loss": 0.6869, + "mean_token_accuracy": 0.7885134279727936, + "num_tokens": 153614313.0, + "step": 65880 + }, + { + "epoch": 0.6041074539286697, + "learning_rate": 7.918034289905566e-05, + "loss": 0.6876, + "mean_token_accuracy": 0.7845796167850494, + "num_tokens": 153638843.0, + "step": 65890 + }, + { + "epoch": 0.6041991381681489, + "learning_rate": 7.916200605115982e-05, + "loss": 0.6624, + "mean_token_accuracy": 0.7969128489494324, + "num_tokens": 153662982.0, + "step": 65900 + }, + { + "epoch": 0.6042908224076281, + "learning_rate": 7.914366920326395e-05, + "loss": 0.6855, + "mean_token_accuracy": 0.7880733489990235, + "num_tokens": 153688288.0, + "step": 65910 + }, + { + "epoch": 0.6043825066471074, + "learning_rate": 7.912533235536812e-05, + "loss": 0.6844, + "mean_token_accuracy": 0.7834518909454345, + "num_tokens": 153714107.0, + "step": 65920 + }, + { + "epoch": 0.6044741908865866, + "learning_rate": 7.910699550747227e-05, + "loss": 0.675, + "mean_token_accuracy": 0.7943445026874543, + "num_tokens": 153739601.0, + "step": 65930 + }, + { + "epoch": 0.6045658751260659, + "learning_rate": 7.908865865957642e-05, + "loss": 0.6808, + "mean_token_accuracy": 0.7905770540237427, + "num_tokens": 153764907.0, + "step": 65940 + }, + { + "epoch": 0.6046575593655451, + "learning_rate": 7.907032181168058e-05, + "loss": 0.6786, + "mean_token_accuracy": 0.7863018035888671, + "num_tokens": 153789890.0, + "step": 65950 + }, + { + "epoch": 0.6047492436050242, + "learning_rate": 7.905198496378473e-05, + "loss": 0.6935, + "mean_token_accuracy": 0.7891980350017548, + "num_tokens": 153814873.0, + "step": 65960 + }, + { + "epoch": 0.6048409278445035, + "learning_rate": 7.903364811588888e-05, + "loss": 0.6963, + "mean_token_accuracy": 0.7839482605457306, + "num_tokens": 153839615.0, + "step": 65970 + }, + { + "epoch": 0.6049326120839827, + "learning_rate": 7.901531126799303e-05, + "loss": 0.6444, + "mean_token_accuracy": 0.7941844642162323, + "num_tokens": 153865150.0, + "step": 65980 + }, + { + "epoch": 0.605024296323462, + "learning_rate": 7.89969744200972e-05, + "loss": 0.7063, + "mean_token_accuracy": 0.7747714757919312, + "num_tokens": 153890668.0, + "step": 65990 + }, + { + "epoch": 0.6051159805629412, + "learning_rate": 7.897863757220135e-05, + "loss": 0.7315, + "mean_token_accuracy": 0.7796947598457337, + "num_tokens": 153914890.0, + "step": 66000 + }, + { + "epoch": 0.6052076648024205, + "learning_rate": 7.896030072430549e-05, + "loss": 0.6805, + "mean_token_accuracy": 0.7874993741512298, + "num_tokens": 153940568.0, + "step": 66010 + }, + { + "epoch": 0.6052993490418997, + "learning_rate": 7.894196387640965e-05, + "loss": 0.672, + "mean_token_accuracy": 0.7885223090648651, + "num_tokens": 153966239.0, + "step": 66020 + }, + { + "epoch": 0.6053910332813789, + "learning_rate": 7.89236270285138e-05, + "loss": 0.6866, + "mean_token_accuracy": 0.792020708322525, + "num_tokens": 153991411.0, + "step": 66030 + }, + { + "epoch": 0.6054827175208581, + "learning_rate": 7.890529018061796e-05, + "loss": 0.7079, + "mean_token_accuracy": 0.7849093317985535, + "num_tokens": 154016435.0, + "step": 66040 + }, + { + "epoch": 0.6055744017603374, + "learning_rate": 7.888695333272211e-05, + "loss": 0.69, + "mean_token_accuracy": 0.7888876736164093, + "num_tokens": 154041285.0, + "step": 66050 + }, + { + "epoch": 0.6056660859998166, + "learning_rate": 7.886861648482626e-05, + "loss": 0.7135, + "mean_token_accuracy": 0.7864153563976288, + "num_tokens": 154066652.0, + "step": 66060 + }, + { + "epoch": 0.6057577702392959, + "learning_rate": 7.885027963693041e-05, + "loss": 0.6402, + "mean_token_accuracy": 0.7941450238227844, + "num_tokens": 154091648.0, + "step": 66070 + }, + { + "epoch": 0.6058494544787751, + "learning_rate": 7.883194278903458e-05, + "loss": 0.687, + "mean_token_accuracy": 0.789392215013504, + "num_tokens": 154115807.0, + "step": 66080 + }, + { + "epoch": 0.6059411387182543, + "learning_rate": 7.881360594113873e-05, + "loss": 0.7184, + "mean_token_accuracy": 0.7835983037948608, + "num_tokens": 154141467.0, + "step": 66090 + }, + { + "epoch": 0.6060328229577335, + "learning_rate": 7.879526909324288e-05, + "loss": 0.7087, + "mean_token_accuracy": 0.7765124142169952, + "num_tokens": 154166574.0, + "step": 66100 + }, + { + "epoch": 0.6061245071972128, + "learning_rate": 7.877693224534702e-05, + "loss": 0.6813, + "mean_token_accuracy": 0.7879556477069855, + "num_tokens": 154192557.0, + "step": 66110 + }, + { + "epoch": 0.606216191436692, + "learning_rate": 7.875859539745118e-05, + "loss": 0.7186, + "mean_token_accuracy": 0.7812003195285797, + "num_tokens": 154217456.0, + "step": 66120 + }, + { + "epoch": 0.6063078756761713, + "learning_rate": 7.874025854955534e-05, + "loss": 0.6783, + "mean_token_accuracy": 0.7895727813243866, + "num_tokens": 154241983.0, + "step": 66130 + }, + { + "epoch": 0.6063995599156505, + "learning_rate": 7.872192170165949e-05, + "loss": 0.72, + "mean_token_accuracy": 0.7837452471256257, + "num_tokens": 154267125.0, + "step": 66140 + }, + { + "epoch": 0.6064912441551298, + "learning_rate": 7.870358485376364e-05, + "loss": 0.6925, + "mean_token_accuracy": 0.7894594967365265, + "num_tokens": 154292480.0, + "step": 66150 + }, + { + "epoch": 0.6065829283946089, + "learning_rate": 7.868524800586779e-05, + "loss": 0.7277, + "mean_token_accuracy": 0.777235871553421, + "num_tokens": 154317003.0, + "step": 66160 + }, + { + "epoch": 0.6066746126340882, + "learning_rate": 7.866691115797194e-05, + "loss": 0.6992, + "mean_token_accuracy": 0.78583984375, + "num_tokens": 154341664.0, + "step": 66170 + }, + { + "epoch": 0.6067662968735674, + "learning_rate": 7.864857431007611e-05, + "loss": 0.6981, + "mean_token_accuracy": 0.7841795980930328, + "num_tokens": 154367685.0, + "step": 66180 + }, + { + "epoch": 0.6068579811130467, + "learning_rate": 7.863023746218026e-05, + "loss": 0.7056, + "mean_token_accuracy": 0.7853238999843597, + "num_tokens": 154392983.0, + "step": 66190 + }, + { + "epoch": 0.6069496653525259, + "learning_rate": 7.861190061428441e-05, + "loss": 0.662, + "mean_token_accuracy": 0.788264536857605, + "num_tokens": 154417989.0, + "step": 66200 + }, + { + "epoch": 0.6070413495920052, + "learning_rate": 7.859356376638856e-05, + "loss": 0.6915, + "mean_token_accuracy": 0.7927573800086976, + "num_tokens": 154442933.0, + "step": 66210 + }, + { + "epoch": 0.6071330338314843, + "learning_rate": 7.857522691849272e-05, + "loss": 0.6847, + "mean_token_accuracy": 0.7889310359954834, + "num_tokens": 154468468.0, + "step": 66220 + }, + { + "epoch": 0.6072247180709636, + "learning_rate": 7.855689007059687e-05, + "loss": 0.711, + "mean_token_accuracy": 0.781570988893509, + "num_tokens": 154494333.0, + "step": 66230 + }, + { + "epoch": 0.6073164023104428, + "learning_rate": 7.853855322270102e-05, + "loss": 0.7277, + "mean_token_accuracy": 0.7829683005809784, + "num_tokens": 154518972.0, + "step": 66240 + }, + { + "epoch": 0.6074080865499221, + "learning_rate": 7.852021637480517e-05, + "loss": 0.6766, + "mean_token_accuracy": 0.7889496207237243, + "num_tokens": 154544166.0, + "step": 66250 + }, + { + "epoch": 0.6074997707894013, + "learning_rate": 7.850187952690932e-05, + "loss": 0.6857, + "mean_token_accuracy": 0.787873649597168, + "num_tokens": 154569209.0, + "step": 66260 + }, + { + "epoch": 0.6075914550288806, + "learning_rate": 7.848354267901348e-05, + "loss": 0.6607, + "mean_token_accuracy": 0.7953478693962097, + "num_tokens": 154595147.0, + "step": 66270 + }, + { + "epoch": 0.6076831392683598, + "learning_rate": 7.846520583111764e-05, + "loss": 0.6955, + "mean_token_accuracy": 0.786862713098526, + "num_tokens": 154620154.0, + "step": 66280 + }, + { + "epoch": 0.607774823507839, + "learning_rate": 7.844686898322179e-05, + "loss": 0.6978, + "mean_token_accuracy": 0.7850846529006958, + "num_tokens": 154646012.0, + "step": 66290 + }, + { + "epoch": 0.6078665077473182, + "learning_rate": 7.842853213532594e-05, + "loss": 0.6983, + "mean_token_accuracy": 0.7846573770046235, + "num_tokens": 154670715.0, + "step": 66300 + }, + { + "epoch": 0.6079581919867975, + "learning_rate": 7.84101952874301e-05, + "loss": 0.6838, + "mean_token_accuracy": 0.7916235387325287, + "num_tokens": 154695808.0, + "step": 66310 + }, + { + "epoch": 0.6080498762262767, + "learning_rate": 7.839185843953425e-05, + "loss": 0.7, + "mean_token_accuracy": 0.7809223353862762, + "num_tokens": 154720924.0, + "step": 66320 + }, + { + "epoch": 0.608141560465756, + "learning_rate": 7.83735215916384e-05, + "loss": 0.6847, + "mean_token_accuracy": 0.7868905007839203, + "num_tokens": 154746165.0, + "step": 66330 + }, + { + "epoch": 0.6082332447052352, + "learning_rate": 7.835518474374255e-05, + "loss": 0.6847, + "mean_token_accuracy": 0.7884917736053467, + "num_tokens": 154770724.0, + "step": 66340 + }, + { + "epoch": 0.6083249289447143, + "learning_rate": 7.83368478958467e-05, + "loss": 0.6779, + "mean_token_accuracy": 0.7910633623600006, + "num_tokens": 154795434.0, + "step": 66350 + }, + { + "epoch": 0.6084166131841936, + "learning_rate": 7.831851104795086e-05, + "loss": 0.7047, + "mean_token_accuracy": 0.7864468812942504, + "num_tokens": 154820367.0, + "step": 66360 + }, + { + "epoch": 0.6085082974236729, + "learning_rate": 7.830017420005501e-05, + "loss": 0.7404, + "mean_token_accuracy": 0.774083936214447, + "num_tokens": 154845031.0, + "step": 66370 + }, + { + "epoch": 0.6085999816631521, + "learning_rate": 7.828183735215917e-05, + "loss": 0.705, + "mean_token_accuracy": 0.7764290571212769, + "num_tokens": 154870638.0, + "step": 66380 + }, + { + "epoch": 0.6086916659026314, + "learning_rate": 7.826350050426333e-05, + "loss": 0.7305, + "mean_token_accuracy": 0.7796914041042328, + "num_tokens": 154894919.0, + "step": 66390 + }, + { + "epoch": 0.6087833501421106, + "learning_rate": 7.824516365636748e-05, + "loss": 0.6968, + "mean_token_accuracy": 0.786124074459076, + "num_tokens": 154920073.0, + "step": 66400 + }, + { + "epoch": 0.6088750343815899, + "learning_rate": 7.822682680847163e-05, + "loss": 0.7448, + "mean_token_accuracy": 0.7776680946350097, + "num_tokens": 154945245.0, + "step": 66410 + }, + { + "epoch": 0.608966718621069, + "learning_rate": 7.820848996057578e-05, + "loss": 0.7104, + "mean_token_accuracy": 0.789386659860611, + "num_tokens": 154970398.0, + "step": 66420 + }, + { + "epoch": 0.6090584028605482, + "learning_rate": 7.819015311267993e-05, + "loss": 0.6997, + "mean_token_accuracy": 0.7849281609058381, + "num_tokens": 154995479.0, + "step": 66430 + }, + { + "epoch": 0.6091500871000275, + "learning_rate": 7.81718162647841e-05, + "loss": 0.7237, + "mean_token_accuracy": 0.7780871987342834, + "num_tokens": 155019548.0, + "step": 66440 + }, + { + "epoch": 0.6092417713395067, + "learning_rate": 7.815347941688824e-05, + "loss": 0.7068, + "mean_token_accuracy": 0.7843786537647247, + "num_tokens": 155044277.0, + "step": 66450 + }, + { + "epoch": 0.609333455578986, + "learning_rate": 7.813514256899239e-05, + "loss": 0.6721, + "mean_token_accuracy": 0.7907335042953492, + "num_tokens": 155069265.0, + "step": 66460 + }, + { + "epoch": 0.6094251398184652, + "learning_rate": 7.811680572109654e-05, + "loss": 0.6991, + "mean_token_accuracy": 0.7900092720985412, + "num_tokens": 155093391.0, + "step": 66470 + }, + { + "epoch": 0.6095168240579444, + "learning_rate": 7.80984688732007e-05, + "loss": 0.6776, + "mean_token_accuracy": 0.79387868642807, + "num_tokens": 155118283.0, + "step": 66480 + }, + { + "epoch": 0.6096085082974236, + "learning_rate": 7.808013202530486e-05, + "loss": 0.7238, + "mean_token_accuracy": 0.7838686764240265, + "num_tokens": 155143267.0, + "step": 66490 + }, + { + "epoch": 0.6097001925369029, + "learning_rate": 7.806179517740901e-05, + "loss": 0.6896, + "mean_token_accuracy": 0.7886497557163239, + "num_tokens": 155169101.0, + "step": 66500 + }, + { + "epoch": 0.6097918767763821, + "learning_rate": 7.804345832951316e-05, + "loss": 0.7015, + "mean_token_accuracy": 0.78909552693367, + "num_tokens": 155194197.0, + "step": 66510 + }, + { + "epoch": 0.6098835610158614, + "learning_rate": 7.802512148161731e-05, + "loss": 0.7024, + "mean_token_accuracy": 0.7856522023677825, + "num_tokens": 155218838.0, + "step": 66520 + }, + { + "epoch": 0.6099752452553406, + "learning_rate": 7.800678463372146e-05, + "loss": 0.6838, + "mean_token_accuracy": 0.781846672296524, + "num_tokens": 155244430.0, + "step": 66530 + }, + { + "epoch": 0.6100669294948199, + "learning_rate": 7.798844778582563e-05, + "loss": 0.71, + "mean_token_accuracy": 0.7862145066261291, + "num_tokens": 155269316.0, + "step": 66540 + }, + { + "epoch": 0.610158613734299, + "learning_rate": 7.797011093792977e-05, + "loss": 0.6943, + "mean_token_accuracy": 0.7887844622135163, + "num_tokens": 155294074.0, + "step": 66550 + }, + { + "epoch": 0.6102502979737783, + "learning_rate": 7.795177409003392e-05, + "loss": 0.6874, + "mean_token_accuracy": 0.7871222496032715, + "num_tokens": 155319491.0, + "step": 66560 + }, + { + "epoch": 0.6103419822132575, + "learning_rate": 7.793343724213809e-05, + "loss": 0.6749, + "mean_token_accuracy": 0.7936574578285217, + "num_tokens": 155344162.0, + "step": 66570 + }, + { + "epoch": 0.6104336664527368, + "learning_rate": 7.791510039424224e-05, + "loss": 0.7191, + "mean_token_accuracy": 0.7807522296905518, + "num_tokens": 155369480.0, + "step": 66580 + }, + { + "epoch": 0.610525350692216, + "learning_rate": 7.789676354634639e-05, + "loss": 0.7317, + "mean_token_accuracy": 0.7801062822341919, + "num_tokens": 155394359.0, + "step": 66590 + }, + { + "epoch": 0.6106170349316953, + "learning_rate": 7.787842669845054e-05, + "loss": 0.7029, + "mean_token_accuracy": 0.7821816086769104, + "num_tokens": 155420199.0, + "step": 66600 + }, + { + "epoch": 0.6107087191711745, + "learning_rate": 7.78600898505547e-05, + "loss": 0.6847, + "mean_token_accuracy": 0.7910413682460785, + "num_tokens": 155445553.0, + "step": 66610 + }, + { + "epoch": 0.6108004034106537, + "learning_rate": 7.784175300265885e-05, + "loss": 0.6781, + "mean_token_accuracy": 0.7924752593040466, + "num_tokens": 155471458.0, + "step": 66620 + }, + { + "epoch": 0.6108920876501329, + "learning_rate": 7.7823416154763e-05, + "loss": 0.6906, + "mean_token_accuracy": 0.7882384598255158, + "num_tokens": 155496276.0, + "step": 66630 + }, + { + "epoch": 0.6109837718896122, + "learning_rate": 7.780507930686716e-05, + "loss": 0.7126, + "mean_token_accuracy": 0.7846039772033692, + "num_tokens": 155522026.0, + "step": 66640 + }, + { + "epoch": 0.6110754561290914, + "learning_rate": 7.77867424589713e-05, + "loss": 0.6756, + "mean_token_accuracy": 0.7927641093730926, + "num_tokens": 155547187.0, + "step": 66650 + }, + { + "epoch": 0.6111671403685707, + "learning_rate": 7.776840561107545e-05, + "loss": 0.7098, + "mean_token_accuracy": 0.7821052551269532, + "num_tokens": 155572669.0, + "step": 66660 + }, + { + "epoch": 0.6112588246080499, + "learning_rate": 7.775006876317962e-05, + "loss": 0.6805, + "mean_token_accuracy": 0.7912693440914154, + "num_tokens": 155597605.0, + "step": 66670 + }, + { + "epoch": 0.6113505088475291, + "learning_rate": 7.773173191528377e-05, + "loss": 0.7139, + "mean_token_accuracy": 0.7910090684890747, + "num_tokens": 155621597.0, + "step": 66680 + }, + { + "epoch": 0.6114421930870083, + "learning_rate": 7.771339506738792e-05, + "loss": 0.6892, + "mean_token_accuracy": 0.7859422266483307, + "num_tokens": 155646764.0, + "step": 66690 + }, + { + "epoch": 0.6115338773264876, + "learning_rate": 7.769505821949207e-05, + "loss": 0.6584, + "mean_token_accuracy": 0.7977186799049377, + "num_tokens": 155671194.0, + "step": 66700 + }, + { + "epoch": 0.6116255615659668, + "learning_rate": 7.767672137159623e-05, + "loss": 0.7097, + "mean_token_accuracy": 0.7835528433322907, + "num_tokens": 155695446.0, + "step": 66710 + }, + { + "epoch": 0.6117172458054461, + "learning_rate": 7.765838452370038e-05, + "loss": 0.6863, + "mean_token_accuracy": 0.7886665225028991, + "num_tokens": 155720593.0, + "step": 66720 + }, + { + "epoch": 0.6118089300449253, + "learning_rate": 7.764004767580453e-05, + "loss": 0.7051, + "mean_token_accuracy": 0.7883149862289429, + "num_tokens": 155745718.0, + "step": 66730 + }, + { + "epoch": 0.6119006142844046, + "learning_rate": 7.76217108279087e-05, + "loss": 0.684, + "mean_token_accuracy": 0.7954345703125, + "num_tokens": 155771621.0, + "step": 66740 + }, + { + "epoch": 0.6119922985238837, + "learning_rate": 7.760337398001283e-05, + "loss": 0.6599, + "mean_token_accuracy": 0.7985195457935333, + "num_tokens": 155797266.0, + "step": 66750 + }, + { + "epoch": 0.612083982763363, + "learning_rate": 7.758503713211699e-05, + "loss": 0.6536, + "mean_token_accuracy": 0.7971826255321502, + "num_tokens": 155822315.0, + "step": 66760 + }, + { + "epoch": 0.6121756670028422, + "learning_rate": 7.756670028422115e-05, + "loss": 0.7785, + "mean_token_accuracy": 0.7700275838375091, + "num_tokens": 155847309.0, + "step": 66770 + }, + { + "epoch": 0.6122673512423215, + "learning_rate": 7.75483634363253e-05, + "loss": 0.6882, + "mean_token_accuracy": 0.7865087866783143, + "num_tokens": 155872658.0, + "step": 66780 + }, + { + "epoch": 0.6123590354818007, + "learning_rate": 7.753002658842945e-05, + "loss": 0.7319, + "mean_token_accuracy": 0.7749264895915985, + "num_tokens": 155897432.0, + "step": 66790 + }, + { + "epoch": 0.61245071972128, + "learning_rate": 7.75116897405336e-05, + "loss": 0.6767, + "mean_token_accuracy": 0.7922833502292633, + "num_tokens": 155923215.0, + "step": 66800 + }, + { + "epoch": 0.6125424039607591, + "learning_rate": 7.749335289263776e-05, + "loss": 0.7127, + "mean_token_accuracy": 0.7818540394306183, + "num_tokens": 155947542.0, + "step": 66810 + }, + { + "epoch": 0.6126340882002383, + "learning_rate": 7.747501604474191e-05, + "loss": 0.6779, + "mean_token_accuracy": 0.7884433686733245, + "num_tokens": 155972351.0, + "step": 66820 + }, + { + "epoch": 0.6127257724397176, + "learning_rate": 7.745667919684606e-05, + "loss": 0.6881, + "mean_token_accuracy": 0.7872499525547028, + "num_tokens": 155997837.0, + "step": 66830 + }, + { + "epoch": 0.6128174566791968, + "learning_rate": 7.743834234895023e-05, + "loss": 0.7038, + "mean_token_accuracy": 0.7881186842918396, + "num_tokens": 156023628.0, + "step": 66840 + }, + { + "epoch": 0.6129091409186761, + "learning_rate": 7.742000550105437e-05, + "loss": 0.6833, + "mean_token_accuracy": 0.7897855699062347, + "num_tokens": 156048835.0, + "step": 66850 + }, + { + "epoch": 0.6130008251581553, + "learning_rate": 7.740166865315852e-05, + "loss": 0.7076, + "mean_token_accuracy": 0.7861597776412964, + "num_tokens": 156074913.0, + "step": 66860 + }, + { + "epoch": 0.6130925093976346, + "learning_rate": 7.738333180526268e-05, + "loss": 0.7162, + "mean_token_accuracy": 0.7880714237689972, + "num_tokens": 156100667.0, + "step": 66870 + }, + { + "epoch": 0.6131841936371137, + "learning_rate": 7.736499495736683e-05, + "loss": 0.6888, + "mean_token_accuracy": 0.7895596146583557, + "num_tokens": 156125793.0, + "step": 66880 + }, + { + "epoch": 0.613275877876593, + "learning_rate": 7.734665810947099e-05, + "loss": 0.7233, + "mean_token_accuracy": 0.7790824055671692, + "num_tokens": 156150583.0, + "step": 66890 + }, + { + "epoch": 0.6133675621160722, + "learning_rate": 7.732832126157514e-05, + "loss": 0.6943, + "mean_token_accuracy": 0.7864419519901276, + "num_tokens": 156176158.0, + "step": 66900 + }, + { + "epoch": 0.6134592463555515, + "learning_rate": 7.730998441367929e-05, + "loss": 0.667, + "mean_token_accuracy": 0.7933214724063873, + "num_tokens": 156201836.0, + "step": 66910 + }, + { + "epoch": 0.6135509305950307, + "learning_rate": 7.729164756578344e-05, + "loss": 0.7022, + "mean_token_accuracy": 0.7909168124198913, + "num_tokens": 156226603.0, + "step": 66920 + }, + { + "epoch": 0.61364261483451, + "learning_rate": 7.727331071788761e-05, + "loss": 0.6734, + "mean_token_accuracy": 0.7896043121814728, + "num_tokens": 156251709.0, + "step": 66930 + }, + { + "epoch": 0.6137342990739891, + "learning_rate": 7.725497386999176e-05, + "loss": 0.7271, + "mean_token_accuracy": 0.781232750415802, + "num_tokens": 156277127.0, + "step": 66940 + }, + { + "epoch": 0.6138259833134684, + "learning_rate": 7.72366370220959e-05, + "loss": 0.6989, + "mean_token_accuracy": 0.7875811159610748, + "num_tokens": 156302300.0, + "step": 66950 + }, + { + "epoch": 0.6139176675529476, + "learning_rate": 7.721830017420005e-05, + "loss": 0.7139, + "mean_token_accuracy": 0.7815785825252533, + "num_tokens": 156327265.0, + "step": 66960 + }, + { + "epoch": 0.6140093517924269, + "learning_rate": 7.719996332630421e-05, + "loss": 0.6665, + "mean_token_accuracy": 0.7898998618125915, + "num_tokens": 156353015.0, + "step": 66970 + }, + { + "epoch": 0.6141010360319061, + "learning_rate": 7.718162647840837e-05, + "loss": 0.7116, + "mean_token_accuracy": 0.7818050742149353, + "num_tokens": 156378368.0, + "step": 66980 + }, + { + "epoch": 0.6141927202713854, + "learning_rate": 7.716328963051252e-05, + "loss": 0.6938, + "mean_token_accuracy": 0.7857789099216461, + "num_tokens": 156403537.0, + "step": 66990 + }, + { + "epoch": 0.6142844045108646, + "learning_rate": 7.714495278261667e-05, + "loss": 0.69, + "mean_token_accuracy": 0.7888389229774475, + "num_tokens": 156428130.0, + "step": 67000 + }, + { + "epoch": 0.6143760887503438, + "learning_rate": 7.712661593472082e-05, + "loss": 0.7437, + "mean_token_accuracy": 0.7711461544036865, + "num_tokens": 156453116.0, + "step": 67010 + }, + { + "epoch": 0.614467772989823, + "learning_rate": 7.710827908682497e-05, + "loss": 0.7387, + "mean_token_accuracy": 0.7768138706684112, + "num_tokens": 156478578.0, + "step": 67020 + }, + { + "epoch": 0.6145594572293023, + "learning_rate": 7.708994223892914e-05, + "loss": 0.6782, + "mean_token_accuracy": 0.7902256846427917, + "num_tokens": 156503763.0, + "step": 67030 + }, + { + "epoch": 0.6146511414687815, + "learning_rate": 7.707160539103329e-05, + "loss": 0.7186, + "mean_token_accuracy": 0.7766977071762085, + "num_tokens": 156529907.0, + "step": 67040 + }, + { + "epoch": 0.6147428257082608, + "learning_rate": 7.705326854313743e-05, + "loss": 0.6821, + "mean_token_accuracy": 0.7826661825180053, + "num_tokens": 156554295.0, + "step": 67050 + }, + { + "epoch": 0.61483450994774, + "learning_rate": 7.70349316952416e-05, + "loss": 0.7177, + "mean_token_accuracy": 0.7832845389842987, + "num_tokens": 156579377.0, + "step": 67060 + }, + { + "epoch": 0.6149261941872192, + "learning_rate": 7.701659484734575e-05, + "loss": 0.6498, + "mean_token_accuracy": 0.7975553512573242, + "num_tokens": 156604321.0, + "step": 67070 + }, + { + "epoch": 0.6150178784266984, + "learning_rate": 7.69982579994499e-05, + "loss": 0.676, + "mean_token_accuracy": 0.7933587968349457, + "num_tokens": 156630279.0, + "step": 67080 + }, + { + "epoch": 0.6151095626661777, + "learning_rate": 7.697992115155405e-05, + "loss": 0.6865, + "mean_token_accuracy": 0.7899942874908448, + "num_tokens": 156655172.0, + "step": 67090 + }, + { + "epoch": 0.6152012469056569, + "learning_rate": 7.69615843036582e-05, + "loss": 0.6712, + "mean_token_accuracy": 0.7936025261878967, + "num_tokens": 156680564.0, + "step": 67100 + }, + { + "epoch": 0.6152929311451362, + "learning_rate": 7.694324745576235e-05, + "loss": 0.6335, + "mean_token_accuracy": 0.7987747192382812, + "num_tokens": 156705787.0, + "step": 67110 + }, + { + "epoch": 0.6153846153846154, + "learning_rate": 7.69249106078665e-05, + "loss": 0.7345, + "mean_token_accuracy": 0.7793562829494476, + "num_tokens": 156730527.0, + "step": 67120 + }, + { + "epoch": 0.6154762996240947, + "learning_rate": 7.690657375997067e-05, + "loss": 0.7091, + "mean_token_accuracy": 0.783651489019394, + "num_tokens": 156755189.0, + "step": 67130 + }, + { + "epoch": 0.6155679838635738, + "learning_rate": 7.688823691207482e-05, + "loss": 0.6564, + "mean_token_accuracy": 0.7978248178958893, + "num_tokens": 156779933.0, + "step": 67140 + }, + { + "epoch": 0.6156596681030531, + "learning_rate": 7.686990006417896e-05, + "loss": 0.7086, + "mean_token_accuracy": 0.7844275593757629, + "num_tokens": 156805423.0, + "step": 67150 + }, + { + "epoch": 0.6157513523425323, + "learning_rate": 7.685156321628313e-05, + "loss": 0.7118, + "mean_token_accuracy": 0.7816203474998474, + "num_tokens": 156829540.0, + "step": 67160 + }, + { + "epoch": 0.6158430365820116, + "learning_rate": 7.683322636838728e-05, + "loss": 0.7119, + "mean_token_accuracy": 0.7806913375854492, + "num_tokens": 156854815.0, + "step": 67170 + }, + { + "epoch": 0.6159347208214908, + "learning_rate": 7.681488952049143e-05, + "loss": 0.674, + "mean_token_accuracy": 0.7896641671657563, + "num_tokens": 156879989.0, + "step": 67180 + }, + { + "epoch": 0.6160264050609701, + "learning_rate": 7.679655267259558e-05, + "loss": 0.683, + "mean_token_accuracy": 0.7872275531291961, + "num_tokens": 156905207.0, + "step": 67190 + }, + { + "epoch": 0.6161180893004492, + "learning_rate": 7.677821582469973e-05, + "loss": 0.6838, + "mean_token_accuracy": 0.7908446371555329, + "num_tokens": 156930267.0, + "step": 67200 + }, + { + "epoch": 0.6162097735399285, + "learning_rate": 7.675987897680389e-05, + "loss": 0.6878, + "mean_token_accuracy": 0.7871572077274323, + "num_tokens": 156955934.0, + "step": 67210 + }, + { + "epoch": 0.6163014577794077, + "learning_rate": 7.674154212890804e-05, + "loss": 0.7319, + "mean_token_accuracy": 0.7791761040687561, + "num_tokens": 156980544.0, + "step": 67220 + }, + { + "epoch": 0.616393142018887, + "learning_rate": 7.67232052810122e-05, + "loss": 0.7133, + "mean_token_accuracy": 0.786835378408432, + "num_tokens": 157005548.0, + "step": 67230 + }, + { + "epoch": 0.6164848262583662, + "learning_rate": 7.670486843311636e-05, + "loss": 0.7041, + "mean_token_accuracy": 0.7829742968082428, + "num_tokens": 157030166.0, + "step": 67240 + }, + { + "epoch": 0.6165765104978455, + "learning_rate": 7.66865315852205e-05, + "loss": 0.6677, + "mean_token_accuracy": 0.790830647945404, + "num_tokens": 157055006.0, + "step": 67250 + }, + { + "epoch": 0.6166681947373247, + "learning_rate": 7.666819473732466e-05, + "loss": 0.673, + "mean_token_accuracy": 0.7910701930522919, + "num_tokens": 157079972.0, + "step": 67260 + }, + { + "epoch": 0.6167598789768038, + "learning_rate": 7.664985788942881e-05, + "loss": 0.6681, + "mean_token_accuracy": 0.7905817687511444, + "num_tokens": 157104639.0, + "step": 67270 + }, + { + "epoch": 0.6168515632162831, + "learning_rate": 7.663152104153296e-05, + "loss": 0.7024, + "mean_token_accuracy": 0.7871637105941772, + "num_tokens": 157129677.0, + "step": 67280 + }, + { + "epoch": 0.6169432474557623, + "learning_rate": 7.661318419363712e-05, + "loss": 0.6734, + "mean_token_accuracy": 0.7909211337566375, + "num_tokens": 157154585.0, + "step": 67290 + }, + { + "epoch": 0.6170349316952416, + "learning_rate": 7.659484734574127e-05, + "loss": 0.6731, + "mean_token_accuracy": 0.7936107039451599, + "num_tokens": 157179804.0, + "step": 67300 + }, + { + "epoch": 0.6171266159347208, + "learning_rate": 7.657651049784542e-05, + "loss": 0.6973, + "mean_token_accuracy": 0.7843657255172729, + "num_tokens": 157205066.0, + "step": 67310 + }, + { + "epoch": 0.6172183001742001, + "learning_rate": 7.655817364994958e-05, + "loss": 0.7115, + "mean_token_accuracy": 0.7843078374862671, + "num_tokens": 157229961.0, + "step": 67320 + }, + { + "epoch": 0.6173099844136792, + "learning_rate": 7.653983680205374e-05, + "loss": 0.6947, + "mean_token_accuracy": 0.788511061668396, + "num_tokens": 157255586.0, + "step": 67330 + }, + { + "epoch": 0.6174016686531585, + "learning_rate": 7.652149995415789e-05, + "loss": 0.6678, + "mean_token_accuracy": 0.7950996577739715, + "num_tokens": 157281970.0, + "step": 67340 + }, + { + "epoch": 0.6174933528926377, + "learning_rate": 7.650316310626203e-05, + "loss": 0.6811, + "mean_token_accuracy": 0.7874180376529694, + "num_tokens": 157307710.0, + "step": 67350 + }, + { + "epoch": 0.617585037132117, + "learning_rate": 7.648482625836619e-05, + "loss": 0.65, + "mean_token_accuracy": 0.7945042431354523, + "num_tokens": 157332924.0, + "step": 67360 + }, + { + "epoch": 0.6176767213715962, + "learning_rate": 7.646648941047034e-05, + "loss": 0.6894, + "mean_token_accuracy": 0.7862263977527618, + "num_tokens": 157358222.0, + "step": 67370 + }, + { + "epoch": 0.6177684056110755, + "learning_rate": 7.64481525625745e-05, + "loss": 0.7443, + "mean_token_accuracy": 0.7707981467247009, + "num_tokens": 157382854.0, + "step": 67380 + }, + { + "epoch": 0.6178600898505547, + "learning_rate": 7.642981571467865e-05, + "loss": 0.7035, + "mean_token_accuracy": 0.7888554453849792, + "num_tokens": 157407841.0, + "step": 67390 + }, + { + "epoch": 0.6179517740900339, + "learning_rate": 7.64114788667828e-05, + "loss": 0.6663, + "mean_token_accuracy": 0.7951247453689575, + "num_tokens": 157432579.0, + "step": 67400 + }, + { + "epoch": 0.6180434583295131, + "learning_rate": 7.639314201888695e-05, + "loss": 0.6863, + "mean_token_accuracy": 0.7897823691368103, + "num_tokens": 157456865.0, + "step": 67410 + }, + { + "epoch": 0.6181351425689924, + "learning_rate": 7.637480517099112e-05, + "loss": 0.7004, + "mean_token_accuracy": 0.7874565184116363, + "num_tokens": 157482026.0, + "step": 67420 + }, + { + "epoch": 0.6182268268084716, + "learning_rate": 7.635646832309527e-05, + "loss": 0.7098, + "mean_token_accuracy": 0.780177116394043, + "num_tokens": 157507826.0, + "step": 67430 + }, + { + "epoch": 0.6183185110479509, + "learning_rate": 7.633813147519942e-05, + "loss": 0.6708, + "mean_token_accuracy": 0.7879915475845337, + "num_tokens": 157533046.0, + "step": 67440 + }, + { + "epoch": 0.6184101952874301, + "learning_rate": 7.631979462730356e-05, + "loss": 0.6771, + "mean_token_accuracy": 0.7879619240760803, + "num_tokens": 157558964.0, + "step": 67450 + }, + { + "epoch": 0.6185018795269093, + "learning_rate": 7.630145777940772e-05, + "loss": 0.6794, + "mean_token_accuracy": 0.7913801431655884, + "num_tokens": 157583569.0, + "step": 67460 + }, + { + "epoch": 0.6185935637663885, + "learning_rate": 7.628312093151188e-05, + "loss": 0.6729, + "mean_token_accuracy": 0.794334328174591, + "num_tokens": 157607935.0, + "step": 67470 + }, + { + "epoch": 0.6186852480058678, + "learning_rate": 7.626478408361603e-05, + "loss": 0.6404, + "mean_token_accuracy": 0.7993609726428985, + "num_tokens": 157633464.0, + "step": 67480 + }, + { + "epoch": 0.618776932245347, + "learning_rate": 7.624644723572018e-05, + "loss": 0.6785, + "mean_token_accuracy": 0.7915915846824646, + "num_tokens": 157659110.0, + "step": 67490 + }, + { + "epoch": 0.6188686164848263, + "learning_rate": 7.622811038782433e-05, + "loss": 0.6898, + "mean_token_accuracy": 0.7868053615093231, + "num_tokens": 157684742.0, + "step": 67500 + }, + { + "epoch": 0.6189603007243055, + "learning_rate": 7.620977353992848e-05, + "loss": 0.6743, + "mean_token_accuracy": 0.7934269189834595, + "num_tokens": 157708553.0, + "step": 67510 + }, + { + "epoch": 0.6190519849637848, + "learning_rate": 7.619143669203265e-05, + "loss": 0.6754, + "mean_token_accuracy": 0.7853560388088227, + "num_tokens": 157733195.0, + "step": 67520 + }, + { + "epoch": 0.6191436692032639, + "learning_rate": 7.61730998441368e-05, + "loss": 0.6756, + "mean_token_accuracy": 0.792363291978836, + "num_tokens": 157758076.0, + "step": 67530 + }, + { + "epoch": 0.6192353534427432, + "learning_rate": 7.615476299624095e-05, + "loss": 0.6926, + "mean_token_accuracy": 0.7883324027061462, + "num_tokens": 157783227.0, + "step": 67540 + }, + { + "epoch": 0.6193270376822224, + "learning_rate": 7.61364261483451e-05, + "loss": 0.6745, + "mean_token_accuracy": 0.7916837930679321, + "num_tokens": 157808657.0, + "step": 67550 + }, + { + "epoch": 0.6194187219217017, + "learning_rate": 7.611808930044926e-05, + "loss": 0.659, + "mean_token_accuracy": 0.7989928483963012, + "num_tokens": 157833941.0, + "step": 67560 + }, + { + "epoch": 0.6195104061611809, + "learning_rate": 7.609975245255341e-05, + "loss": 0.7092, + "mean_token_accuracy": 0.7815617918968201, + "num_tokens": 157858955.0, + "step": 67570 + }, + { + "epoch": 0.6196020904006602, + "learning_rate": 7.608141560465756e-05, + "loss": 0.6927, + "mean_token_accuracy": 0.789283150434494, + "num_tokens": 157884222.0, + "step": 67580 + }, + { + "epoch": 0.6196937746401393, + "learning_rate": 7.606307875676171e-05, + "loss": 0.6934, + "mean_token_accuracy": 0.7907307505607605, + "num_tokens": 157909958.0, + "step": 67590 + }, + { + "epoch": 0.6197854588796186, + "learning_rate": 7.604474190886586e-05, + "loss": 0.7398, + "mean_token_accuracy": 0.774592113494873, + "num_tokens": 157935871.0, + "step": 67600 + }, + { + "epoch": 0.6198771431190978, + "learning_rate": 7.602640506097002e-05, + "loss": 0.7288, + "mean_token_accuracy": 0.7738948345184327, + "num_tokens": 157962152.0, + "step": 67610 + }, + { + "epoch": 0.6199688273585771, + "learning_rate": 7.600806821307418e-05, + "loss": 0.7182, + "mean_token_accuracy": 0.7898809969425201, + "num_tokens": 157987051.0, + "step": 67620 + }, + { + "epoch": 0.6200605115980563, + "learning_rate": 7.598973136517833e-05, + "loss": 0.7003, + "mean_token_accuracy": 0.7832739412784576, + "num_tokens": 158012377.0, + "step": 67630 + }, + { + "epoch": 0.6201521958375356, + "learning_rate": 7.597139451728248e-05, + "loss": 0.6528, + "mean_token_accuracy": 0.7969177067279816, + "num_tokens": 158036551.0, + "step": 67640 + }, + { + "epoch": 0.6202438800770148, + "learning_rate": 7.595305766938664e-05, + "loss": 0.6872, + "mean_token_accuracy": 0.7888841569423676, + "num_tokens": 158061939.0, + "step": 67650 + }, + { + "epoch": 0.620335564316494, + "learning_rate": 7.593472082149079e-05, + "loss": 0.7137, + "mean_token_accuracy": 0.7862693428993225, + "num_tokens": 158087081.0, + "step": 67660 + }, + { + "epoch": 0.6204272485559732, + "learning_rate": 7.591638397359494e-05, + "loss": 0.6574, + "mean_token_accuracy": 0.79624143242836, + "num_tokens": 158112517.0, + "step": 67670 + }, + { + "epoch": 0.6205189327954524, + "learning_rate": 7.58980471256991e-05, + "loss": 0.6847, + "mean_token_accuracy": 0.7950810492038727, + "num_tokens": 158138209.0, + "step": 67680 + }, + { + "epoch": 0.6206106170349317, + "learning_rate": 7.587971027780324e-05, + "loss": 0.7043, + "mean_token_accuracy": 0.7870907127857208, + "num_tokens": 158163371.0, + "step": 67690 + }, + { + "epoch": 0.620702301274411, + "learning_rate": 7.58613734299074e-05, + "loss": 0.7176, + "mean_token_accuracy": 0.7789473712444306, + "num_tokens": 158189126.0, + "step": 67700 + }, + { + "epoch": 0.6207939855138902, + "learning_rate": 7.584303658201155e-05, + "loss": 0.7079, + "mean_token_accuracy": 0.7856812477111816, + "num_tokens": 158213851.0, + "step": 67710 + }, + { + "epoch": 0.6208856697533695, + "learning_rate": 7.582469973411571e-05, + "loss": 0.6688, + "mean_token_accuracy": 0.7929436683654785, + "num_tokens": 158238262.0, + "step": 67720 + }, + { + "epoch": 0.6209773539928486, + "learning_rate": 7.580636288621987e-05, + "loss": 0.6784, + "mean_token_accuracy": 0.793372493982315, + "num_tokens": 158263671.0, + "step": 67730 + }, + { + "epoch": 0.6210690382323278, + "learning_rate": 7.578802603832402e-05, + "loss": 0.6735, + "mean_token_accuracy": 0.7910674631595611, + "num_tokens": 158289257.0, + "step": 67740 + }, + { + "epoch": 0.6211607224718071, + "learning_rate": 7.576968919042817e-05, + "loss": 0.6598, + "mean_token_accuracy": 0.7980355381965637, + "num_tokens": 158314173.0, + "step": 67750 + }, + { + "epoch": 0.6212524067112863, + "learning_rate": 7.575135234253232e-05, + "loss": 0.7411, + "mean_token_accuracy": 0.7710571587085724, + "num_tokens": 158339097.0, + "step": 67760 + }, + { + "epoch": 0.6213440909507656, + "learning_rate": 7.573301549463647e-05, + "loss": 0.6912, + "mean_token_accuracy": 0.7877136707305908, + "num_tokens": 158364302.0, + "step": 67770 + }, + { + "epoch": 0.6214357751902448, + "learning_rate": 7.571467864674064e-05, + "loss": 0.6822, + "mean_token_accuracy": 0.784754729270935, + "num_tokens": 158389615.0, + "step": 67780 + }, + { + "epoch": 0.621527459429724, + "learning_rate": 7.569634179884478e-05, + "loss": 0.6901, + "mean_token_accuracy": 0.7908022820949554, + "num_tokens": 158414937.0, + "step": 67790 + }, + { + "epoch": 0.6216191436692032, + "learning_rate": 7.567800495094893e-05, + "loss": 0.7016, + "mean_token_accuracy": 0.7832824528217316, + "num_tokens": 158440457.0, + "step": 67800 + }, + { + "epoch": 0.6217108279086825, + "learning_rate": 7.56596681030531e-05, + "loss": 0.7132, + "mean_token_accuracy": 0.7835166871547699, + "num_tokens": 158465443.0, + "step": 67810 + }, + { + "epoch": 0.6218025121481617, + "learning_rate": 7.564133125515725e-05, + "loss": 0.7072, + "mean_token_accuracy": 0.7831239640712738, + "num_tokens": 158490287.0, + "step": 67820 + }, + { + "epoch": 0.621894196387641, + "learning_rate": 7.56229944072614e-05, + "loss": 0.7148, + "mean_token_accuracy": 0.7799515902996064, + "num_tokens": 158515253.0, + "step": 67830 + }, + { + "epoch": 0.6219858806271202, + "learning_rate": 7.560465755936555e-05, + "loss": 0.6924, + "mean_token_accuracy": 0.7871422111988068, + "num_tokens": 158540757.0, + "step": 67840 + }, + { + "epoch": 0.6220775648665995, + "learning_rate": 7.55863207114697e-05, + "loss": 0.7205, + "mean_token_accuracy": 0.7767223000526429, + "num_tokens": 158565672.0, + "step": 67850 + }, + { + "epoch": 0.6221692491060786, + "learning_rate": 7.556798386357385e-05, + "loss": 0.657, + "mean_token_accuracy": 0.7968750596046448, + "num_tokens": 158590417.0, + "step": 67860 + }, + { + "epoch": 0.6222609333455579, + "learning_rate": 7.5549647015678e-05, + "loss": 0.6996, + "mean_token_accuracy": 0.7919406414031982, + "num_tokens": 158616112.0, + "step": 67870 + }, + { + "epoch": 0.6223526175850371, + "learning_rate": 7.553131016778217e-05, + "loss": 0.6979, + "mean_token_accuracy": 0.7862891614437103, + "num_tokens": 158641112.0, + "step": 67880 + }, + { + "epoch": 0.6224443018245164, + "learning_rate": 7.551297331988631e-05, + "loss": 0.6621, + "mean_token_accuracy": 0.7982531368732453, + "num_tokens": 158666558.0, + "step": 67890 + }, + { + "epoch": 0.6225359860639956, + "learning_rate": 7.549463647199046e-05, + "loss": 0.7145, + "mean_token_accuracy": 0.7796647191047669, + "num_tokens": 158691011.0, + "step": 67900 + }, + { + "epoch": 0.6226276703034749, + "learning_rate": 7.547629962409463e-05, + "loss": 0.6755, + "mean_token_accuracy": 0.7932925701141358, + "num_tokens": 158716251.0, + "step": 67910 + }, + { + "epoch": 0.622719354542954, + "learning_rate": 7.545796277619878e-05, + "loss": 0.6513, + "mean_token_accuracy": 0.7988629639148712, + "num_tokens": 158740514.0, + "step": 67920 + }, + { + "epoch": 0.6228110387824333, + "learning_rate": 7.543962592830293e-05, + "loss": 0.6702, + "mean_token_accuracy": 0.7902235269546509, + "num_tokens": 158765137.0, + "step": 67930 + }, + { + "epoch": 0.6229027230219125, + "learning_rate": 7.542128908040708e-05, + "loss": 0.7062, + "mean_token_accuracy": 0.7847516477108002, + "num_tokens": 158789701.0, + "step": 67940 + }, + { + "epoch": 0.6229944072613918, + "learning_rate": 7.540295223251123e-05, + "loss": 0.6742, + "mean_token_accuracy": 0.7943823873996735, + "num_tokens": 158814902.0, + "step": 67950 + }, + { + "epoch": 0.623086091500871, + "learning_rate": 7.538461538461539e-05, + "loss": 0.7007, + "mean_token_accuracy": 0.7827964663505554, + "num_tokens": 158839992.0, + "step": 67960 + }, + { + "epoch": 0.6231777757403503, + "learning_rate": 7.536627853671954e-05, + "loss": 0.6837, + "mean_token_accuracy": 0.7875102579593658, + "num_tokens": 158864454.0, + "step": 67970 + }, + { + "epoch": 0.6232694599798295, + "learning_rate": 7.53479416888237e-05, + "loss": 0.6534, + "mean_token_accuracy": 0.7980010867118835, + "num_tokens": 158889217.0, + "step": 67980 + }, + { + "epoch": 0.6233611442193087, + "learning_rate": 7.532960484092784e-05, + "loss": 0.685, + "mean_token_accuracy": 0.7899937689304352, + "num_tokens": 158913924.0, + "step": 67990 + }, + { + "epoch": 0.6234528284587879, + "learning_rate": 7.531126799303199e-05, + "loss": 0.6946, + "mean_token_accuracy": 0.78940549492836, + "num_tokens": 158939065.0, + "step": 68000 + }, + { + "epoch": 0.6235445126982672, + "learning_rate": 7.529293114513616e-05, + "loss": 0.6984, + "mean_token_accuracy": 0.7817919611930847, + "num_tokens": 158965309.0, + "step": 68010 + }, + { + "epoch": 0.6236361969377464, + "learning_rate": 7.527459429724031e-05, + "loss": 0.6909, + "mean_token_accuracy": 0.781625235080719, + "num_tokens": 158990683.0, + "step": 68020 + }, + { + "epoch": 0.6237278811772257, + "learning_rate": 7.525625744934446e-05, + "loss": 0.6671, + "mean_token_accuracy": 0.7947934448719025, + "num_tokens": 159016280.0, + "step": 68030 + }, + { + "epoch": 0.6238195654167049, + "learning_rate": 7.523792060144861e-05, + "loss": 0.6937, + "mean_token_accuracy": 0.7849284529685974, + "num_tokens": 159041934.0, + "step": 68040 + }, + { + "epoch": 0.623911249656184, + "learning_rate": 7.521958375355277e-05, + "loss": 0.6812, + "mean_token_accuracy": 0.789916741847992, + "num_tokens": 159067684.0, + "step": 68050 + }, + { + "epoch": 0.6240029338956633, + "learning_rate": 7.520124690565692e-05, + "loss": 0.6706, + "mean_token_accuracy": 0.7881591260433197, + "num_tokens": 159093100.0, + "step": 68060 + }, + { + "epoch": 0.6240946181351426, + "learning_rate": 7.518291005776107e-05, + "loss": 0.7146, + "mean_token_accuracy": 0.7809472620487213, + "num_tokens": 159118988.0, + "step": 68070 + }, + { + "epoch": 0.6241863023746218, + "learning_rate": 7.516457320986523e-05, + "loss": 0.6568, + "mean_token_accuracy": 0.7976008296012879, + "num_tokens": 159144479.0, + "step": 68080 + }, + { + "epoch": 0.624277986614101, + "learning_rate": 7.514623636196937e-05, + "loss": 0.6609, + "mean_token_accuracy": 0.7967592477798462, + "num_tokens": 159169705.0, + "step": 68090 + }, + { + "epoch": 0.6243696708535803, + "learning_rate": 7.512789951407353e-05, + "loss": 0.6936, + "mean_token_accuracy": 0.7881568074226379, + "num_tokens": 159195729.0, + "step": 68100 + }, + { + "epoch": 0.6244613550930596, + "learning_rate": 7.510956266617769e-05, + "loss": 0.721, + "mean_token_accuracy": 0.781345933675766, + "num_tokens": 159219812.0, + "step": 68110 + }, + { + "epoch": 0.6245530393325387, + "learning_rate": 7.509122581828184e-05, + "loss": 0.6658, + "mean_token_accuracy": 0.7950010359287262, + "num_tokens": 159244728.0, + "step": 68120 + }, + { + "epoch": 0.624644723572018, + "learning_rate": 7.5072888970386e-05, + "loss": 0.663, + "mean_token_accuracy": 0.7935277819633484, + "num_tokens": 159271032.0, + "step": 68130 + }, + { + "epoch": 0.6247364078114972, + "learning_rate": 7.505455212249015e-05, + "loss": 0.6694, + "mean_token_accuracy": 0.7925786733627319, + "num_tokens": 159295563.0, + "step": 68140 + }, + { + "epoch": 0.6248280920509764, + "learning_rate": 7.50362152745943e-05, + "loss": 0.6793, + "mean_token_accuracy": 0.7868499159812927, + "num_tokens": 159320547.0, + "step": 68150 + }, + { + "epoch": 0.6249197762904557, + "learning_rate": 7.501787842669845e-05, + "loss": 0.6916, + "mean_token_accuracy": 0.7876942098140717, + "num_tokens": 159345078.0, + "step": 68160 + }, + { + "epoch": 0.625011460529935, + "learning_rate": 7.499954157880262e-05, + "loss": 0.7137, + "mean_token_accuracy": 0.787305474281311, + "num_tokens": 159370032.0, + "step": 68170 + }, + { + "epoch": 0.6251031447694141, + "learning_rate": 7.498120473090677e-05, + "loss": 0.7139, + "mean_token_accuracy": 0.7832253873348236, + "num_tokens": 159395624.0, + "step": 68180 + }, + { + "epoch": 0.6251948290088933, + "learning_rate": 7.49628678830109e-05, + "loss": 0.6923, + "mean_token_accuracy": 0.7877730906009675, + "num_tokens": 159421516.0, + "step": 68190 + }, + { + "epoch": 0.6252865132483726, + "learning_rate": 7.494453103511506e-05, + "loss": 0.7026, + "mean_token_accuracy": 0.7831994831562042, + "num_tokens": 159446982.0, + "step": 68200 + }, + { + "epoch": 0.6253781974878518, + "learning_rate": 7.492619418721922e-05, + "loss": 0.6846, + "mean_token_accuracy": 0.792252266407013, + "num_tokens": 159472086.0, + "step": 68210 + }, + { + "epoch": 0.6254698817273311, + "learning_rate": 7.490785733932337e-05, + "loss": 0.6524, + "mean_token_accuracy": 0.7992007553577423, + "num_tokens": 159497352.0, + "step": 68220 + }, + { + "epoch": 0.6255615659668103, + "learning_rate": 7.488952049142753e-05, + "loss": 0.6822, + "mean_token_accuracy": 0.7904492437839508, + "num_tokens": 159522219.0, + "step": 68230 + }, + { + "epoch": 0.6256532502062896, + "learning_rate": 7.487118364353168e-05, + "loss": 0.7184, + "mean_token_accuracy": 0.7877139449119568, + "num_tokens": 159547681.0, + "step": 68240 + }, + { + "epoch": 0.6257449344457687, + "learning_rate": 7.485284679563583e-05, + "loss": 0.7304, + "mean_token_accuracy": 0.7756365776062012, + "num_tokens": 159574205.0, + "step": 68250 + }, + { + "epoch": 0.625836618685248, + "learning_rate": 7.483450994773998e-05, + "loss": 0.7168, + "mean_token_accuracy": 0.7812732100486756, + "num_tokens": 159599703.0, + "step": 68260 + }, + { + "epoch": 0.6259283029247272, + "learning_rate": 7.481617309984415e-05, + "loss": 0.6825, + "mean_token_accuracy": 0.7851893424987793, + "num_tokens": 159625739.0, + "step": 68270 + }, + { + "epoch": 0.6260199871642065, + "learning_rate": 7.47978362519483e-05, + "loss": 0.7585, + "mean_token_accuracy": 0.7742206215858459, + "num_tokens": 159651381.0, + "step": 68280 + }, + { + "epoch": 0.6261116714036857, + "learning_rate": 7.477949940405244e-05, + "loss": 0.6818, + "mean_token_accuracy": 0.7892438113689423, + "num_tokens": 159677000.0, + "step": 68290 + }, + { + "epoch": 0.626203355643165, + "learning_rate": 7.47611625561566e-05, + "loss": 0.6823, + "mean_token_accuracy": 0.7935108661651611, + "num_tokens": 159702447.0, + "step": 68300 + }, + { + "epoch": 0.6262950398826441, + "learning_rate": 7.474282570826075e-05, + "loss": 0.6853, + "mean_token_accuracy": 0.7863902390003205, + "num_tokens": 159727576.0, + "step": 68310 + }, + { + "epoch": 0.6263867241221234, + "learning_rate": 7.47244888603649e-05, + "loss": 0.6942, + "mean_token_accuracy": 0.7879535675048828, + "num_tokens": 159752600.0, + "step": 68320 + }, + { + "epoch": 0.6264784083616026, + "learning_rate": 7.470615201246906e-05, + "loss": 0.6898, + "mean_token_accuracy": 0.7876635611057281, + "num_tokens": 159777417.0, + "step": 68330 + }, + { + "epoch": 0.6265700926010819, + "learning_rate": 7.468781516457321e-05, + "loss": 0.6535, + "mean_token_accuracy": 0.7975645959377289, + "num_tokens": 159802098.0, + "step": 68340 + }, + { + "epoch": 0.6266617768405611, + "learning_rate": 7.466947831667736e-05, + "loss": 0.6866, + "mean_token_accuracy": 0.7913213193416595, + "num_tokens": 159827170.0, + "step": 68350 + }, + { + "epoch": 0.6267534610800404, + "learning_rate": 7.465114146878151e-05, + "loss": 0.6605, + "mean_token_accuracy": 0.7892809808254242, + "num_tokens": 159852126.0, + "step": 68360 + }, + { + "epoch": 0.6268451453195196, + "learning_rate": 7.463280462088568e-05, + "loss": 0.6893, + "mean_token_accuracy": 0.790635347366333, + "num_tokens": 159877759.0, + "step": 68370 + }, + { + "epoch": 0.6269368295589988, + "learning_rate": 7.461446777298983e-05, + "loss": 0.7017, + "mean_token_accuracy": 0.7819789409637451, + "num_tokens": 159903098.0, + "step": 68380 + }, + { + "epoch": 0.627028513798478, + "learning_rate": 7.459613092509398e-05, + "loss": 0.6865, + "mean_token_accuracy": 0.785049992799759, + "num_tokens": 159928235.0, + "step": 68390 + }, + { + "epoch": 0.6271201980379573, + "learning_rate": 7.457779407719814e-05, + "loss": 0.6836, + "mean_token_accuracy": 0.7889967024326324, + "num_tokens": 159953100.0, + "step": 68400 + }, + { + "epoch": 0.6272118822774365, + "learning_rate": 7.455945722930229e-05, + "loss": 0.6901, + "mean_token_accuracy": 0.7829911768436432, + "num_tokens": 159977772.0, + "step": 68410 + }, + { + "epoch": 0.6273035665169158, + "learning_rate": 7.454112038140644e-05, + "loss": 0.691, + "mean_token_accuracy": 0.7903009057044983, + "num_tokens": 160003315.0, + "step": 68420 + }, + { + "epoch": 0.627395250756395, + "learning_rate": 7.45227835335106e-05, + "loss": 0.696, + "mean_token_accuracy": 0.7848869740962983, + "num_tokens": 160028126.0, + "step": 68430 + }, + { + "epoch": 0.6274869349958742, + "learning_rate": 7.450444668561474e-05, + "loss": 0.7172, + "mean_token_accuracy": 0.7832297563552857, + "num_tokens": 160053885.0, + "step": 68440 + }, + { + "epoch": 0.6275786192353534, + "learning_rate": 7.44861098377189e-05, + "loss": 0.7098, + "mean_token_accuracy": 0.7870866298675537, + "num_tokens": 160079105.0, + "step": 68450 + }, + { + "epoch": 0.6276703034748327, + "learning_rate": 7.446777298982305e-05, + "loss": 0.6725, + "mean_token_accuracy": 0.79354248046875, + "num_tokens": 160103810.0, + "step": 68460 + }, + { + "epoch": 0.6277619877143119, + "learning_rate": 7.444943614192721e-05, + "loss": 0.7052, + "mean_token_accuracy": 0.7852420270442962, + "num_tokens": 160129041.0, + "step": 68470 + }, + { + "epoch": 0.6278536719537912, + "learning_rate": 7.443109929403136e-05, + "loss": 0.7034, + "mean_token_accuracy": 0.7870183765888215, + "num_tokens": 160154299.0, + "step": 68480 + }, + { + "epoch": 0.6279453561932704, + "learning_rate": 7.441276244613552e-05, + "loss": 0.6687, + "mean_token_accuracy": 0.792228901386261, + "num_tokens": 160180271.0, + "step": 68490 + }, + { + "epoch": 0.6280370404327497, + "learning_rate": 7.439442559823967e-05, + "loss": 0.7165, + "mean_token_accuracy": 0.7853408753871918, + "num_tokens": 160205271.0, + "step": 68500 + }, + { + "epoch": 0.6281287246722288, + "learning_rate": 7.437608875034382e-05, + "loss": 0.6822, + "mean_token_accuracy": 0.7885018885135651, + "num_tokens": 160230505.0, + "step": 68510 + }, + { + "epoch": 0.628220408911708, + "learning_rate": 7.435775190244797e-05, + "loss": 0.6792, + "mean_token_accuracy": 0.7850334107875824, + "num_tokens": 160255950.0, + "step": 68520 + }, + { + "epoch": 0.6283120931511873, + "learning_rate": 7.433941505455214e-05, + "loss": 0.6909, + "mean_token_accuracy": 0.78346386551857, + "num_tokens": 160280976.0, + "step": 68530 + }, + { + "epoch": 0.6284037773906666, + "learning_rate": 7.432107820665627e-05, + "loss": 0.6505, + "mean_token_accuracy": 0.7980206906795502, + "num_tokens": 160305881.0, + "step": 68540 + }, + { + "epoch": 0.6284954616301458, + "learning_rate": 7.430274135876043e-05, + "loss": 0.6826, + "mean_token_accuracy": 0.7878010094165802, + "num_tokens": 160331851.0, + "step": 68550 + }, + { + "epoch": 0.628587145869625, + "learning_rate": 7.428440451086459e-05, + "loss": 0.7262, + "mean_token_accuracy": 0.7825631320476532, + "num_tokens": 160356091.0, + "step": 68560 + }, + { + "epoch": 0.6286788301091042, + "learning_rate": 7.426606766296874e-05, + "loss": 0.6708, + "mean_token_accuracy": 0.7878499090671539, + "num_tokens": 160381118.0, + "step": 68570 + }, + { + "epoch": 0.6287705143485834, + "learning_rate": 7.42477308150729e-05, + "loss": 0.6771, + "mean_token_accuracy": 0.7930330097675323, + "num_tokens": 160406181.0, + "step": 68580 + }, + { + "epoch": 0.6288621985880627, + "learning_rate": 7.422939396717705e-05, + "loss": 0.69, + "mean_token_accuracy": 0.7923729062080384, + "num_tokens": 160431267.0, + "step": 68590 + }, + { + "epoch": 0.6289538828275419, + "learning_rate": 7.42110571192812e-05, + "loss": 0.6805, + "mean_token_accuracy": 0.7918398797512054, + "num_tokens": 160456798.0, + "step": 68600 + }, + { + "epoch": 0.6290455670670212, + "learning_rate": 7.419272027138535e-05, + "loss": 0.6748, + "mean_token_accuracy": 0.7926307797431946, + "num_tokens": 160481610.0, + "step": 68610 + }, + { + "epoch": 0.6291372513065004, + "learning_rate": 7.41743834234895e-05, + "loss": 0.669, + "mean_token_accuracy": 0.7898163974285126, + "num_tokens": 160506613.0, + "step": 68620 + }, + { + "epoch": 0.6292289355459797, + "learning_rate": 7.415604657559367e-05, + "loss": 0.6936, + "mean_token_accuracy": 0.7894938290119171, + "num_tokens": 160531525.0, + "step": 68630 + }, + { + "epoch": 0.6293206197854588, + "learning_rate": 7.413770972769781e-05, + "loss": 0.6822, + "mean_token_accuracy": 0.7915955781936646, + "num_tokens": 160557369.0, + "step": 68640 + }, + { + "epoch": 0.6294123040249381, + "learning_rate": 7.411937287980196e-05, + "loss": 0.6929, + "mean_token_accuracy": 0.7915159463882446, + "num_tokens": 160582371.0, + "step": 68650 + }, + { + "epoch": 0.6295039882644173, + "learning_rate": 7.410103603190612e-05, + "loss": 0.674, + "mean_token_accuracy": 0.7909412145614624, + "num_tokens": 160607686.0, + "step": 68660 + }, + { + "epoch": 0.6295956725038966, + "learning_rate": 7.408269918401028e-05, + "loss": 0.6877, + "mean_token_accuracy": 0.7856991171836853, + "num_tokens": 160633502.0, + "step": 68670 + }, + { + "epoch": 0.6296873567433758, + "learning_rate": 7.406436233611443e-05, + "loss": 0.7075, + "mean_token_accuracy": 0.783650916814804, + "num_tokens": 160658327.0, + "step": 68680 + }, + { + "epoch": 0.6297790409828551, + "learning_rate": 7.404602548821858e-05, + "loss": 0.6849, + "mean_token_accuracy": 0.7868337094783783, + "num_tokens": 160683193.0, + "step": 68690 + }, + { + "epoch": 0.6298707252223342, + "learning_rate": 7.402768864032273e-05, + "loss": 0.6806, + "mean_token_accuracy": 0.7953231811523438, + "num_tokens": 160708083.0, + "step": 68700 + }, + { + "epoch": 0.6299624094618135, + "learning_rate": 7.400935179242688e-05, + "loss": 0.6698, + "mean_token_accuracy": 0.7883341610431671, + "num_tokens": 160733797.0, + "step": 68710 + }, + { + "epoch": 0.6300540937012927, + "learning_rate": 7.399101494453104e-05, + "loss": 0.6896, + "mean_token_accuracy": 0.7837846398353576, + "num_tokens": 160758505.0, + "step": 68720 + }, + { + "epoch": 0.630145777940772, + "learning_rate": 7.39726780966352e-05, + "loss": 0.6595, + "mean_token_accuracy": 0.7963154077529907, + "num_tokens": 160783497.0, + "step": 68730 + }, + { + "epoch": 0.6302374621802512, + "learning_rate": 7.395434124873934e-05, + "loss": 0.6693, + "mean_token_accuracy": 0.7931505084037781, + "num_tokens": 160808186.0, + "step": 68740 + }, + { + "epoch": 0.6303291464197305, + "learning_rate": 7.393600440084349e-05, + "loss": 0.6868, + "mean_token_accuracy": 0.7925294160842895, + "num_tokens": 160833366.0, + "step": 68750 + }, + { + "epoch": 0.6304208306592097, + "learning_rate": 7.391766755294766e-05, + "loss": 0.6862, + "mean_token_accuracy": 0.7858851671218872, + "num_tokens": 160858612.0, + "step": 68760 + }, + { + "epoch": 0.6305125148986889, + "learning_rate": 7.389933070505181e-05, + "loss": 0.692, + "mean_token_accuracy": 0.7893398821353912, + "num_tokens": 160883137.0, + "step": 68770 + }, + { + "epoch": 0.6306041991381681, + "learning_rate": 7.388099385715596e-05, + "loss": 0.6627, + "mean_token_accuracy": 0.7915483295917511, + "num_tokens": 160907773.0, + "step": 68780 + }, + { + "epoch": 0.6306958833776474, + "learning_rate": 7.386265700926011e-05, + "loss": 0.6896, + "mean_token_accuracy": 0.7855119585990906, + "num_tokens": 160932706.0, + "step": 68790 + }, + { + "epoch": 0.6307875676171266, + "learning_rate": 7.384432016136426e-05, + "loss": 0.6736, + "mean_token_accuracy": 0.789964210987091, + "num_tokens": 160958373.0, + "step": 68800 + }, + { + "epoch": 0.6308792518566059, + "learning_rate": 7.382598331346842e-05, + "loss": 0.7153, + "mean_token_accuracy": 0.7786109328269959, + "num_tokens": 160983703.0, + "step": 68810 + }, + { + "epoch": 0.6309709360960851, + "learning_rate": 7.380764646557257e-05, + "loss": 0.679, + "mean_token_accuracy": 0.7911896884441376, + "num_tokens": 161008482.0, + "step": 68820 + }, + { + "epoch": 0.6310626203355643, + "learning_rate": 7.378930961767673e-05, + "loss": 0.7013, + "mean_token_accuracy": 0.7846454560756684, + "num_tokens": 161034256.0, + "step": 68830 + }, + { + "epoch": 0.6311543045750435, + "learning_rate": 7.377097276978087e-05, + "loss": 0.6884, + "mean_token_accuracy": 0.78794926404953, + "num_tokens": 161059363.0, + "step": 68840 + }, + { + "epoch": 0.6312459888145228, + "learning_rate": 7.375263592188502e-05, + "loss": 0.6919, + "mean_token_accuracy": 0.7892571866512299, + "num_tokens": 161085394.0, + "step": 68850 + }, + { + "epoch": 0.631337673054002, + "learning_rate": 7.373429907398919e-05, + "loss": 0.7015, + "mean_token_accuracy": 0.7867662668228149, + "num_tokens": 161111050.0, + "step": 68860 + }, + { + "epoch": 0.6314293572934813, + "learning_rate": 7.371596222609334e-05, + "loss": 0.6986, + "mean_token_accuracy": 0.7836301028728485, + "num_tokens": 161136643.0, + "step": 68870 + }, + { + "epoch": 0.6315210415329605, + "learning_rate": 7.369762537819749e-05, + "loss": 0.6755, + "mean_token_accuracy": 0.7927794218063354, + "num_tokens": 161161751.0, + "step": 68880 + }, + { + "epoch": 0.6316127257724398, + "learning_rate": 7.367928853030164e-05, + "loss": 0.6777, + "mean_token_accuracy": 0.7892790138721466, + "num_tokens": 161186799.0, + "step": 68890 + }, + { + "epoch": 0.6317044100119189, + "learning_rate": 7.36609516824058e-05, + "loss": 0.7165, + "mean_token_accuracy": 0.7814065635204315, + "num_tokens": 161211957.0, + "step": 68900 + }, + { + "epoch": 0.6317960942513982, + "learning_rate": 7.364261483450995e-05, + "loss": 0.6671, + "mean_token_accuracy": 0.7912361443042755, + "num_tokens": 161237330.0, + "step": 68910 + }, + { + "epoch": 0.6318877784908774, + "learning_rate": 7.362427798661411e-05, + "loss": 0.6828, + "mean_token_accuracy": 0.7898914694786072, + "num_tokens": 161262585.0, + "step": 68920 + }, + { + "epoch": 0.6319794627303567, + "learning_rate": 7.360594113871827e-05, + "loss": 0.707, + "mean_token_accuracy": 0.7798745572566986, + "num_tokens": 161287252.0, + "step": 68930 + }, + { + "epoch": 0.6320711469698359, + "learning_rate": 7.35876042908224e-05, + "loss": 0.7061, + "mean_token_accuracy": 0.783891624212265, + "num_tokens": 161312592.0, + "step": 68940 + }, + { + "epoch": 0.6321628312093152, + "learning_rate": 7.356926744292656e-05, + "loss": 0.6751, + "mean_token_accuracy": 0.7935016095638275, + "num_tokens": 161338525.0, + "step": 68950 + }, + { + "epoch": 0.6322545154487944, + "learning_rate": 7.355093059503072e-05, + "loss": 0.6708, + "mean_token_accuracy": 0.7926486909389496, + "num_tokens": 161364118.0, + "step": 68960 + }, + { + "epoch": 0.6323461996882735, + "learning_rate": 7.353259374713487e-05, + "loss": 0.6722, + "mean_token_accuracy": 0.7905098676681519, + "num_tokens": 161388450.0, + "step": 68970 + }, + { + "epoch": 0.6324378839277528, + "learning_rate": 7.351425689923902e-05, + "loss": 0.7016, + "mean_token_accuracy": 0.7835709631443024, + "num_tokens": 161412983.0, + "step": 68980 + }, + { + "epoch": 0.632529568167232, + "learning_rate": 7.349592005134318e-05, + "loss": 0.6919, + "mean_token_accuracy": 0.7910090208053588, + "num_tokens": 161437942.0, + "step": 68990 + }, + { + "epoch": 0.6326212524067113, + "learning_rate": 7.347758320344733e-05, + "loss": 0.6809, + "mean_token_accuracy": 0.7874048054218292, + "num_tokens": 161463038.0, + "step": 69000 + }, + { + "epoch": 0.6327129366461905, + "learning_rate": 7.345924635555148e-05, + "loss": 0.708, + "mean_token_accuracy": 0.7828868746757507, + "num_tokens": 161488773.0, + "step": 69010 + }, + { + "epoch": 0.6328046208856698, + "learning_rate": 7.344090950765565e-05, + "loss": 0.7318, + "mean_token_accuracy": 0.7716870784759522, + "num_tokens": 161513785.0, + "step": 69020 + }, + { + "epoch": 0.6328963051251489, + "learning_rate": 7.34225726597598e-05, + "loss": 0.6856, + "mean_token_accuracy": 0.7896718978881836, + "num_tokens": 161538439.0, + "step": 69030 + }, + { + "epoch": 0.6329879893646282, + "learning_rate": 7.340423581186394e-05, + "loss": 0.6831, + "mean_token_accuracy": 0.7908432126045227, + "num_tokens": 161562950.0, + "step": 69040 + }, + { + "epoch": 0.6330796736041074, + "learning_rate": 7.33858989639681e-05, + "loss": 0.6893, + "mean_token_accuracy": 0.7905107736587524, + "num_tokens": 161588169.0, + "step": 69050 + }, + { + "epoch": 0.6331713578435867, + "learning_rate": 7.336756211607225e-05, + "loss": 0.7245, + "mean_token_accuracy": 0.7878206551074982, + "num_tokens": 161613299.0, + "step": 69060 + }, + { + "epoch": 0.6332630420830659, + "learning_rate": 7.33492252681764e-05, + "loss": 0.717, + "mean_token_accuracy": 0.7835732758045196, + "num_tokens": 161638649.0, + "step": 69070 + }, + { + "epoch": 0.6333547263225452, + "learning_rate": 7.333088842028056e-05, + "loss": 0.6768, + "mean_token_accuracy": 0.78575519323349, + "num_tokens": 161663574.0, + "step": 69080 + }, + { + "epoch": 0.6334464105620244, + "learning_rate": 7.331255157238471e-05, + "loss": 0.6744, + "mean_token_accuracy": 0.7893391013145447, + "num_tokens": 161689046.0, + "step": 69090 + }, + { + "epoch": 0.6335380948015036, + "learning_rate": 7.329421472448886e-05, + "loss": 0.6397, + "mean_token_accuracy": 0.8034017860889435, + "num_tokens": 161714928.0, + "step": 69100 + }, + { + "epoch": 0.6336297790409828, + "learning_rate": 7.327587787659301e-05, + "loss": 0.7134, + "mean_token_accuracy": 0.7835344433784485, + "num_tokens": 161740248.0, + "step": 69110 + }, + { + "epoch": 0.6337214632804621, + "learning_rate": 7.325754102869718e-05, + "loss": 0.6965, + "mean_token_accuracy": 0.7872528672218323, + "num_tokens": 161765673.0, + "step": 69120 + }, + { + "epoch": 0.6338131475199413, + "learning_rate": 7.323920418080133e-05, + "loss": 0.6927, + "mean_token_accuracy": 0.7904843330383301, + "num_tokens": 161790754.0, + "step": 69130 + }, + { + "epoch": 0.6339048317594206, + "learning_rate": 7.322086733290547e-05, + "loss": 0.6893, + "mean_token_accuracy": 0.7881133913993835, + "num_tokens": 161815418.0, + "step": 69140 + }, + { + "epoch": 0.6339965159988998, + "learning_rate": 7.320253048500963e-05, + "loss": 0.6839, + "mean_token_accuracy": 0.7951958656311036, + "num_tokens": 161840543.0, + "step": 69150 + }, + { + "epoch": 0.634088200238379, + "learning_rate": 7.318419363711379e-05, + "loss": 0.698, + "mean_token_accuracy": 0.7868954122066498, + "num_tokens": 161865723.0, + "step": 69160 + }, + { + "epoch": 0.6341798844778582, + "learning_rate": 7.316585678921794e-05, + "loss": 0.6851, + "mean_token_accuracy": 0.784591406583786, + "num_tokens": 161891569.0, + "step": 69170 + }, + { + "epoch": 0.6342715687173375, + "learning_rate": 7.314751994132209e-05, + "loss": 0.701, + "mean_token_accuracy": 0.7829393804073334, + "num_tokens": 161916715.0, + "step": 69180 + }, + { + "epoch": 0.6343632529568167, + "learning_rate": 7.312918309342624e-05, + "loss": 0.6672, + "mean_token_accuracy": 0.7902737379074096, + "num_tokens": 161942283.0, + "step": 69190 + }, + { + "epoch": 0.634454937196296, + "learning_rate": 7.311084624553039e-05, + "loss": 0.686, + "mean_token_accuracy": 0.7868517696857452, + "num_tokens": 161967333.0, + "step": 69200 + }, + { + "epoch": 0.6345466214357752, + "learning_rate": 7.309250939763454e-05, + "loss": 0.6915, + "mean_token_accuracy": 0.7937543034553528, + "num_tokens": 161991895.0, + "step": 69210 + }, + { + "epoch": 0.6346383056752545, + "learning_rate": 7.307417254973871e-05, + "loss": 0.7008, + "mean_token_accuracy": 0.7821727871894837, + "num_tokens": 162016599.0, + "step": 69220 + }, + { + "epoch": 0.6347299899147336, + "learning_rate": 7.305583570184286e-05, + "loss": 0.7003, + "mean_token_accuracy": 0.7775799095630646, + "num_tokens": 162040683.0, + "step": 69230 + }, + { + "epoch": 0.6348216741542129, + "learning_rate": 7.3037498853947e-05, + "loss": 0.6768, + "mean_token_accuracy": 0.7876672208309173, + "num_tokens": 162065294.0, + "step": 69240 + }, + { + "epoch": 0.6349133583936921, + "learning_rate": 7.301916200605117e-05, + "loss": 0.705, + "mean_token_accuracy": 0.7785340487957001, + "num_tokens": 162091109.0, + "step": 69250 + }, + { + "epoch": 0.6350050426331714, + "learning_rate": 7.300082515815532e-05, + "loss": 0.689, + "mean_token_accuracy": 0.7846271574497223, + "num_tokens": 162116535.0, + "step": 69260 + }, + { + "epoch": 0.6350967268726506, + "learning_rate": 7.298248831025947e-05, + "loss": 0.7037, + "mean_token_accuracy": 0.7866622090339661, + "num_tokens": 162141796.0, + "step": 69270 + }, + { + "epoch": 0.6351884111121299, + "learning_rate": 7.296415146236362e-05, + "loss": 0.6917, + "mean_token_accuracy": 0.7887984454631806, + "num_tokens": 162166980.0, + "step": 69280 + }, + { + "epoch": 0.635280095351609, + "learning_rate": 7.294581461446777e-05, + "loss": 0.7387, + "mean_token_accuracy": 0.7799351513385773, + "num_tokens": 162191990.0, + "step": 69290 + }, + { + "epoch": 0.6353717795910883, + "learning_rate": 7.292747776657193e-05, + "loss": 0.6883, + "mean_token_accuracy": 0.7883966267108917, + "num_tokens": 162216548.0, + "step": 69300 + }, + { + "epoch": 0.6354634638305675, + "learning_rate": 7.290914091867608e-05, + "loss": 0.6486, + "mean_token_accuracy": 0.792574554681778, + "num_tokens": 162241150.0, + "step": 69310 + }, + { + "epoch": 0.6355551480700468, + "learning_rate": 7.289080407078024e-05, + "loss": 0.7235, + "mean_token_accuracy": 0.7742181360721588, + "num_tokens": 162265891.0, + "step": 69320 + }, + { + "epoch": 0.635646832309526, + "learning_rate": 7.28724672228844e-05, + "loss": 0.6605, + "mean_token_accuracy": 0.7921281635761261, + "num_tokens": 162291077.0, + "step": 69330 + }, + { + "epoch": 0.6357385165490053, + "learning_rate": 7.285413037498853e-05, + "loss": 0.6997, + "mean_token_accuracy": 0.7839576721191406, + "num_tokens": 162316990.0, + "step": 69340 + }, + { + "epoch": 0.6358302007884845, + "learning_rate": 7.28357935270927e-05, + "loss": 0.7061, + "mean_token_accuracy": 0.783429092168808, + "num_tokens": 162342798.0, + "step": 69350 + }, + { + "epoch": 0.6359218850279637, + "learning_rate": 7.281745667919685e-05, + "loss": 0.7112, + "mean_token_accuracy": 0.78250093460083, + "num_tokens": 162368283.0, + "step": 69360 + }, + { + "epoch": 0.6360135692674429, + "learning_rate": 7.2799119831301e-05, + "loss": 0.6877, + "mean_token_accuracy": 0.7862596631050109, + "num_tokens": 162394007.0, + "step": 69370 + }, + { + "epoch": 0.6361052535069222, + "learning_rate": 7.278078298340515e-05, + "loss": 0.6973, + "mean_token_accuracy": 0.7891257047653198, + "num_tokens": 162419181.0, + "step": 69380 + }, + { + "epoch": 0.6361969377464014, + "learning_rate": 7.27624461355093e-05, + "loss": 0.7086, + "mean_token_accuracy": 0.781864482164383, + "num_tokens": 162443638.0, + "step": 69390 + }, + { + "epoch": 0.6362886219858807, + "learning_rate": 7.274410928761346e-05, + "loss": 0.7209, + "mean_token_accuracy": 0.7780154645442963, + "num_tokens": 162468992.0, + "step": 69400 + }, + { + "epoch": 0.6363803062253599, + "learning_rate": 7.272577243971762e-05, + "loss": 0.6943, + "mean_token_accuracy": 0.7876321792602539, + "num_tokens": 162494192.0, + "step": 69410 + }, + { + "epoch": 0.636471990464839, + "learning_rate": 7.270743559182177e-05, + "loss": 0.7028, + "mean_token_accuracy": 0.7872909486293793, + "num_tokens": 162519425.0, + "step": 69420 + }, + { + "epoch": 0.6365636747043183, + "learning_rate": 7.268909874392593e-05, + "loss": 0.6848, + "mean_token_accuracy": 0.7924340188503265, + "num_tokens": 162544628.0, + "step": 69430 + }, + { + "epoch": 0.6366553589437975, + "learning_rate": 7.267076189603006e-05, + "loss": 0.6849, + "mean_token_accuracy": 0.7920091986656189, + "num_tokens": 162568395.0, + "step": 69440 + }, + { + "epoch": 0.6367470431832768, + "learning_rate": 7.265242504813423e-05, + "loss": 0.6947, + "mean_token_accuracy": 0.7834534525871277, + "num_tokens": 162593796.0, + "step": 69450 + }, + { + "epoch": 0.636838727422756, + "learning_rate": 7.263408820023838e-05, + "loss": 0.6645, + "mean_token_accuracy": 0.797721940279007, + "num_tokens": 162619053.0, + "step": 69460 + }, + { + "epoch": 0.6369304116622353, + "learning_rate": 7.261575135234253e-05, + "loss": 0.6644, + "mean_token_accuracy": 0.7965146541595459, + "num_tokens": 162644492.0, + "step": 69470 + }, + { + "epoch": 0.6370220959017145, + "learning_rate": 7.259741450444669e-05, + "loss": 0.6738, + "mean_token_accuracy": 0.7905985891819001, + "num_tokens": 162669467.0, + "step": 69480 + }, + { + "epoch": 0.6371137801411937, + "learning_rate": 7.257907765655084e-05, + "loss": 0.6799, + "mean_token_accuracy": 0.7942047357559204, + "num_tokens": 162695123.0, + "step": 69490 + }, + { + "epoch": 0.6372054643806729, + "learning_rate": 7.256074080865499e-05, + "loss": 0.6727, + "mean_token_accuracy": 0.7896474719047546, + "num_tokens": 162720720.0, + "step": 69500 + }, + { + "epoch": 0.6372971486201522, + "learning_rate": 7.254240396075916e-05, + "loss": 0.6833, + "mean_token_accuracy": 0.7888857007026673, + "num_tokens": 162745373.0, + "step": 69510 + }, + { + "epoch": 0.6373888328596314, + "learning_rate": 7.252406711286331e-05, + "loss": 0.6733, + "mean_token_accuracy": 0.7865135848522187, + "num_tokens": 162770538.0, + "step": 69520 + }, + { + "epoch": 0.6374805170991107, + "learning_rate": 7.250573026496746e-05, + "loss": 0.6924, + "mean_token_accuracy": 0.7909885168075561, + "num_tokens": 162795895.0, + "step": 69530 + }, + { + "epoch": 0.6375722013385899, + "learning_rate": 7.248739341707161e-05, + "loss": 0.6288, + "mean_token_accuracy": 0.8023481726646423, + "num_tokens": 162820899.0, + "step": 69540 + }, + { + "epoch": 0.6376638855780691, + "learning_rate": 7.246905656917576e-05, + "loss": 0.702, + "mean_token_accuracy": 0.7822565495967865, + "num_tokens": 162845891.0, + "step": 69550 + }, + { + "epoch": 0.6377555698175483, + "learning_rate": 7.245071972127991e-05, + "loss": 0.704, + "mean_token_accuracy": 0.7825054824352264, + "num_tokens": 162870929.0, + "step": 69560 + }, + { + "epoch": 0.6378472540570276, + "learning_rate": 7.243238287338407e-05, + "loss": 0.7278, + "mean_token_accuracy": 0.7798559546470643, + "num_tokens": 162896226.0, + "step": 69570 + }, + { + "epoch": 0.6379389382965068, + "learning_rate": 7.241404602548822e-05, + "loss": 0.6883, + "mean_token_accuracy": 0.7871682465076446, + "num_tokens": 162921594.0, + "step": 69580 + }, + { + "epoch": 0.6380306225359861, + "learning_rate": 7.239570917759237e-05, + "loss": 0.6872, + "mean_token_accuracy": 0.7882108747959137, + "num_tokens": 162946831.0, + "step": 69590 + }, + { + "epoch": 0.6381223067754653, + "learning_rate": 7.237737232969652e-05, + "loss": 0.7041, + "mean_token_accuracy": 0.7825108349323273, + "num_tokens": 162971362.0, + "step": 69600 + }, + { + "epoch": 0.6382139910149446, + "learning_rate": 7.235903548180069e-05, + "loss": 0.6391, + "mean_token_accuracy": 0.8007571935653687, + "num_tokens": 162996368.0, + "step": 69610 + }, + { + "epoch": 0.6383056752544237, + "learning_rate": 7.234069863390484e-05, + "loss": 0.6606, + "mean_token_accuracy": 0.7967602014541626, + "num_tokens": 163021712.0, + "step": 69620 + }, + { + "epoch": 0.638397359493903, + "learning_rate": 7.232236178600899e-05, + "loss": 0.7315, + "mean_token_accuracy": 0.7771764993667603, + "num_tokens": 163047131.0, + "step": 69630 + }, + { + "epoch": 0.6384890437333822, + "learning_rate": 7.230402493811314e-05, + "loss": 0.6885, + "mean_token_accuracy": 0.7899558424949646, + "num_tokens": 163072048.0, + "step": 69640 + }, + { + "epoch": 0.6385807279728615, + "learning_rate": 7.22856880902173e-05, + "loss": 0.6825, + "mean_token_accuracy": 0.7926486611366272, + "num_tokens": 163098353.0, + "step": 69650 + }, + { + "epoch": 0.6386724122123407, + "learning_rate": 7.226735124232145e-05, + "loss": 0.6799, + "mean_token_accuracy": 0.7868564188480377, + "num_tokens": 163123366.0, + "step": 69660 + }, + { + "epoch": 0.63876409645182, + "learning_rate": 7.224901439442561e-05, + "loss": 0.6733, + "mean_token_accuracy": 0.7880558729171753, + "num_tokens": 163148302.0, + "step": 69670 + }, + { + "epoch": 0.6388557806912991, + "learning_rate": 7.223067754652975e-05, + "loss": 0.6666, + "mean_token_accuracy": 0.790253871679306, + "num_tokens": 163173824.0, + "step": 69680 + }, + { + "epoch": 0.6389474649307784, + "learning_rate": 7.22123406986339e-05, + "loss": 0.668, + "mean_token_accuracy": 0.7905177235603332, + "num_tokens": 163198651.0, + "step": 69690 + }, + { + "epoch": 0.6390391491702576, + "learning_rate": 7.219400385073805e-05, + "loss": 0.667, + "mean_token_accuracy": 0.7918867409229279, + "num_tokens": 163224308.0, + "step": 69700 + }, + { + "epoch": 0.6391308334097369, + "learning_rate": 7.217566700284222e-05, + "loss": 0.6939, + "mean_token_accuracy": 0.7851086556911469, + "num_tokens": 163249267.0, + "step": 69710 + }, + { + "epoch": 0.6392225176492161, + "learning_rate": 7.215733015494637e-05, + "loss": 0.6415, + "mean_token_accuracy": 0.7975740432739258, + "num_tokens": 163274410.0, + "step": 69720 + }, + { + "epoch": 0.6393142018886954, + "learning_rate": 7.213899330705052e-05, + "loss": 0.6817, + "mean_token_accuracy": 0.7886723101139068, + "num_tokens": 163298932.0, + "step": 69730 + }, + { + "epoch": 0.6394058861281746, + "learning_rate": 7.212065645915468e-05, + "loss": 0.6715, + "mean_token_accuracy": 0.7912049293518066, + "num_tokens": 163323643.0, + "step": 69740 + }, + { + "epoch": 0.6394975703676538, + "learning_rate": 7.210231961125883e-05, + "loss": 0.6816, + "mean_token_accuracy": 0.7898310422897339, + "num_tokens": 163348119.0, + "step": 69750 + }, + { + "epoch": 0.639589254607133, + "learning_rate": 7.208398276336298e-05, + "loss": 0.6608, + "mean_token_accuracy": 0.7954709529876709, + "num_tokens": 163373166.0, + "step": 69760 + }, + { + "epoch": 0.6396809388466123, + "learning_rate": 7.206564591546714e-05, + "loss": 0.6933, + "mean_token_accuracy": 0.7857273757457733, + "num_tokens": 163397935.0, + "step": 69770 + }, + { + "epoch": 0.6397726230860915, + "learning_rate": 7.204730906757128e-05, + "loss": 0.6548, + "mean_token_accuracy": 0.7971982300281525, + "num_tokens": 163421941.0, + "step": 69780 + }, + { + "epoch": 0.6398643073255708, + "learning_rate": 7.202897221967543e-05, + "loss": 0.7096, + "mean_token_accuracy": 0.7826210558414459, + "num_tokens": 163446731.0, + "step": 69790 + }, + { + "epoch": 0.63995599156505, + "learning_rate": 7.20106353717796e-05, + "loss": 0.6814, + "mean_token_accuracy": 0.7860031604766846, + "num_tokens": 163472067.0, + "step": 69800 + }, + { + "epoch": 0.6400476758045291, + "learning_rate": 7.199229852388375e-05, + "loss": 0.6937, + "mean_token_accuracy": 0.785373193025589, + "num_tokens": 163496986.0, + "step": 69810 + }, + { + "epoch": 0.6401393600440084, + "learning_rate": 7.19739616759879e-05, + "loss": 0.6741, + "mean_token_accuracy": 0.7898578107357025, + "num_tokens": 163521793.0, + "step": 69820 + }, + { + "epoch": 0.6402310442834876, + "learning_rate": 7.195562482809206e-05, + "loss": 0.6911, + "mean_token_accuracy": 0.7895965039730072, + "num_tokens": 163546456.0, + "step": 69830 + }, + { + "epoch": 0.6403227285229669, + "learning_rate": 7.193728798019621e-05, + "loss": 0.7088, + "mean_token_accuracy": 0.7853328108787536, + "num_tokens": 163571253.0, + "step": 69840 + }, + { + "epoch": 0.6404144127624462, + "learning_rate": 7.191895113230036e-05, + "loss": 0.6655, + "mean_token_accuracy": 0.7966778159141541, + "num_tokens": 163595905.0, + "step": 69850 + }, + { + "epoch": 0.6405060970019254, + "learning_rate": 7.190061428440451e-05, + "loss": 0.7084, + "mean_token_accuracy": 0.7869901061058044, + "num_tokens": 163620350.0, + "step": 69860 + }, + { + "epoch": 0.6405977812414047, + "learning_rate": 7.188227743650868e-05, + "loss": 0.6574, + "mean_token_accuracy": 0.8003265202045441, + "num_tokens": 163646068.0, + "step": 69870 + }, + { + "epoch": 0.6406894654808838, + "learning_rate": 7.186394058861281e-05, + "loss": 0.7159, + "mean_token_accuracy": 0.7857119798660278, + "num_tokens": 163670436.0, + "step": 69880 + }, + { + "epoch": 0.640781149720363, + "learning_rate": 7.184560374071697e-05, + "loss": 0.6487, + "mean_token_accuracy": 0.7965015709400177, + "num_tokens": 163695026.0, + "step": 69890 + }, + { + "epoch": 0.6408728339598423, + "learning_rate": 7.182726689282113e-05, + "loss": 0.7274, + "mean_token_accuracy": 0.7822119891643524, + "num_tokens": 163720320.0, + "step": 69900 + }, + { + "epoch": 0.6409645181993215, + "learning_rate": 7.180893004492528e-05, + "loss": 0.6724, + "mean_token_accuracy": 0.7920660018920899, + "num_tokens": 163745511.0, + "step": 69910 + }, + { + "epoch": 0.6410562024388008, + "learning_rate": 7.179059319702944e-05, + "loss": 0.6887, + "mean_token_accuracy": 0.7868866443634033, + "num_tokens": 163770241.0, + "step": 69920 + }, + { + "epoch": 0.64114788667828, + "learning_rate": 7.177225634913359e-05, + "loss": 0.7023, + "mean_token_accuracy": 0.7846464157104492, + "num_tokens": 163795652.0, + "step": 69930 + }, + { + "epoch": 0.6412395709177592, + "learning_rate": 7.175391950123774e-05, + "loss": 0.6881, + "mean_token_accuracy": 0.7887941777706147, + "num_tokens": 163821072.0, + "step": 69940 + }, + { + "epoch": 0.6413312551572384, + "learning_rate": 7.173558265334189e-05, + "loss": 0.7063, + "mean_token_accuracy": 0.7892722904682159, + "num_tokens": 163845565.0, + "step": 69950 + }, + { + "epoch": 0.6414229393967177, + "learning_rate": 7.171724580544604e-05, + "loss": 0.6867, + "mean_token_accuracy": 0.7910989046096801, + "num_tokens": 163870863.0, + "step": 69960 + }, + { + "epoch": 0.6415146236361969, + "learning_rate": 7.169890895755021e-05, + "loss": 0.7035, + "mean_token_accuracy": 0.7852825403213501, + "num_tokens": 163896814.0, + "step": 69970 + }, + { + "epoch": 0.6416063078756762, + "learning_rate": 7.168057210965435e-05, + "loss": 0.7216, + "mean_token_accuracy": 0.782462191581726, + "num_tokens": 163921146.0, + "step": 69980 + }, + { + "epoch": 0.6416979921151554, + "learning_rate": 7.16622352617585e-05, + "loss": 0.6836, + "mean_token_accuracy": 0.7861079633235931, + "num_tokens": 163945924.0, + "step": 69990 + }, + { + "epoch": 0.6417896763546347, + "learning_rate": 7.164389841386266e-05, + "loss": 0.7098, + "mean_token_accuracy": 0.7870415568351745, + "num_tokens": 163971537.0, + "step": 70000 + }, + { + "epoch": 0.6418813605941138, + "learning_rate": 7.162556156596682e-05, + "loss": 0.6903, + "mean_token_accuracy": 0.7880664765834808, + "num_tokens": 163996861.0, + "step": 70010 + }, + { + "epoch": 0.6419730448335931, + "learning_rate": 7.160722471807097e-05, + "loss": 0.6748, + "mean_token_accuracy": 0.7970955908298493, + "num_tokens": 164021869.0, + "step": 70020 + }, + { + "epoch": 0.6420647290730723, + "learning_rate": 7.158888787017512e-05, + "loss": 0.7076, + "mean_token_accuracy": 0.7810359179973603, + "num_tokens": 164046334.0, + "step": 70030 + }, + { + "epoch": 0.6421564133125516, + "learning_rate": 7.157055102227927e-05, + "loss": 0.6875, + "mean_token_accuracy": 0.7882570087909698, + "num_tokens": 164071630.0, + "step": 70040 + }, + { + "epoch": 0.6422480975520308, + "learning_rate": 7.155221417438342e-05, + "loss": 0.7018, + "mean_token_accuracy": 0.7878653764724731, + "num_tokens": 164096558.0, + "step": 70050 + }, + { + "epoch": 0.6423397817915101, + "learning_rate": 7.153387732648758e-05, + "loss": 0.7, + "mean_token_accuracy": 0.789144092798233, + "num_tokens": 164121370.0, + "step": 70060 + }, + { + "epoch": 0.6424314660309892, + "learning_rate": 7.151554047859174e-05, + "loss": 0.7039, + "mean_token_accuracy": 0.7815370678901672, + "num_tokens": 164146028.0, + "step": 70070 + }, + { + "epoch": 0.6425231502704685, + "learning_rate": 7.149720363069588e-05, + "loss": 0.6586, + "mean_token_accuracy": 0.7944897234439849, + "num_tokens": 164171710.0, + "step": 70080 + }, + { + "epoch": 0.6426148345099477, + "learning_rate": 7.147886678280003e-05, + "loss": 0.686, + "mean_token_accuracy": 0.791346150636673, + "num_tokens": 164196602.0, + "step": 70090 + }, + { + "epoch": 0.642706518749427, + "learning_rate": 7.14605299349042e-05, + "loss": 0.6627, + "mean_token_accuracy": 0.7907776772975922, + "num_tokens": 164221491.0, + "step": 70100 + }, + { + "epoch": 0.6427982029889062, + "learning_rate": 7.144219308700835e-05, + "loss": 0.6898, + "mean_token_accuracy": 0.7849031150341034, + "num_tokens": 164247459.0, + "step": 70110 + }, + { + "epoch": 0.6428898872283855, + "learning_rate": 7.14238562391125e-05, + "loss": 0.6696, + "mean_token_accuracy": 0.791460645198822, + "num_tokens": 164272549.0, + "step": 70120 + }, + { + "epoch": 0.6429815714678647, + "learning_rate": 7.140551939121665e-05, + "loss": 0.7107, + "mean_token_accuracy": 0.7802798926830292, + "num_tokens": 164297250.0, + "step": 70130 + }, + { + "epoch": 0.6430732557073439, + "learning_rate": 7.13871825433208e-05, + "loss": 0.6954, + "mean_token_accuracy": 0.7885702729225159, + "num_tokens": 164322338.0, + "step": 70140 + }, + { + "epoch": 0.6431649399468231, + "learning_rate": 7.136884569542496e-05, + "loss": 0.6853, + "mean_token_accuracy": 0.7821885645389557, + "num_tokens": 164347431.0, + "step": 70150 + }, + { + "epoch": 0.6432566241863024, + "learning_rate": 7.135050884752912e-05, + "loss": 0.6653, + "mean_token_accuracy": 0.8017870903015136, + "num_tokens": 164372925.0, + "step": 70160 + }, + { + "epoch": 0.6433483084257816, + "learning_rate": 7.133217199963327e-05, + "loss": 0.6349, + "mean_token_accuracy": 0.8037239968776703, + "num_tokens": 164397533.0, + "step": 70170 + }, + { + "epoch": 0.6434399926652609, + "learning_rate": 7.131383515173741e-05, + "loss": 0.727, + "mean_token_accuracy": 0.783105605840683, + "num_tokens": 164422345.0, + "step": 70180 + }, + { + "epoch": 0.6435316769047401, + "learning_rate": 7.129549830384156e-05, + "loss": 0.6989, + "mean_token_accuracy": 0.7893296658992768, + "num_tokens": 164446832.0, + "step": 70190 + }, + { + "epoch": 0.6436233611442194, + "learning_rate": 7.127716145594573e-05, + "loss": 0.6495, + "mean_token_accuracy": 0.7958596587181092, + "num_tokens": 164471346.0, + "step": 70200 + }, + { + "epoch": 0.6437150453836985, + "learning_rate": 7.125882460804988e-05, + "loss": 0.702, + "mean_token_accuracy": 0.7869407355785369, + "num_tokens": 164496920.0, + "step": 70210 + }, + { + "epoch": 0.6438067296231778, + "learning_rate": 7.124048776015403e-05, + "loss": 0.6865, + "mean_token_accuracy": 0.7850927472114563, + "num_tokens": 164522293.0, + "step": 70220 + }, + { + "epoch": 0.643898413862657, + "learning_rate": 7.122215091225818e-05, + "loss": 0.6742, + "mean_token_accuracy": 0.7899061143398285, + "num_tokens": 164547079.0, + "step": 70230 + }, + { + "epoch": 0.6439900981021363, + "learning_rate": 7.120381406436234e-05, + "loss": 0.7058, + "mean_token_accuracy": 0.784560638666153, + "num_tokens": 164572493.0, + "step": 70240 + }, + { + "epoch": 0.6440817823416155, + "learning_rate": 7.118547721646649e-05, + "loss": 0.7132, + "mean_token_accuracy": 0.7789095997810364, + "num_tokens": 164597930.0, + "step": 70250 + }, + { + "epoch": 0.6441734665810948, + "learning_rate": 7.116714036857065e-05, + "loss": 0.6685, + "mean_token_accuracy": 0.792503434419632, + "num_tokens": 164622996.0, + "step": 70260 + }, + { + "epoch": 0.6442651508205739, + "learning_rate": 7.11488035206748e-05, + "loss": 0.6744, + "mean_token_accuracy": 0.7918026268482208, + "num_tokens": 164648448.0, + "step": 70270 + }, + { + "epoch": 0.6443568350600531, + "learning_rate": 7.113046667277894e-05, + "loss": 0.6697, + "mean_token_accuracy": 0.7937646448612213, + "num_tokens": 164673196.0, + "step": 70280 + }, + { + "epoch": 0.6444485192995324, + "learning_rate": 7.111212982488311e-05, + "loss": 0.711, + "mean_token_accuracy": 0.7829077959060669, + "num_tokens": 164698768.0, + "step": 70290 + }, + { + "epoch": 0.6445402035390116, + "learning_rate": 7.109379297698726e-05, + "loss": 0.6682, + "mean_token_accuracy": 0.7933432757854462, + "num_tokens": 164723369.0, + "step": 70300 + }, + { + "epoch": 0.6446318877784909, + "learning_rate": 7.107545612909141e-05, + "loss": 0.6743, + "mean_token_accuracy": 0.7898480892181396, + "num_tokens": 164748588.0, + "step": 70310 + }, + { + "epoch": 0.6447235720179701, + "learning_rate": 7.105711928119556e-05, + "loss": 0.7369, + "mean_token_accuracy": 0.7723786234855652, + "num_tokens": 164773080.0, + "step": 70320 + }, + { + "epoch": 0.6448152562574494, + "learning_rate": 7.103878243329972e-05, + "loss": 0.6946, + "mean_token_accuracy": 0.7824502050876617, + "num_tokens": 164798200.0, + "step": 70330 + }, + { + "epoch": 0.6449069404969285, + "learning_rate": 7.102044558540387e-05, + "loss": 0.6517, + "mean_token_accuracy": 0.8015531122684478, + "num_tokens": 164823234.0, + "step": 70340 + }, + { + "epoch": 0.6449986247364078, + "learning_rate": 7.100210873750802e-05, + "loss": 0.6791, + "mean_token_accuracy": 0.7885856449604034, + "num_tokens": 164848631.0, + "step": 70350 + }, + { + "epoch": 0.645090308975887, + "learning_rate": 7.098377188961219e-05, + "loss": 0.682, + "mean_token_accuracy": 0.7893922865390778, + "num_tokens": 164874434.0, + "step": 70360 + }, + { + "epoch": 0.6451819932153663, + "learning_rate": 7.096543504171634e-05, + "loss": 0.6924, + "mean_token_accuracy": 0.7901115536689758, + "num_tokens": 164899874.0, + "step": 70370 + }, + { + "epoch": 0.6452736774548455, + "learning_rate": 7.094709819382048e-05, + "loss": 0.6939, + "mean_token_accuracy": 0.7853074848651886, + "num_tokens": 164925257.0, + "step": 70380 + }, + { + "epoch": 0.6453653616943248, + "learning_rate": 7.092876134592464e-05, + "loss": 0.6707, + "mean_token_accuracy": 0.7973959863185882, + "num_tokens": 164950537.0, + "step": 70390 + }, + { + "epoch": 0.6454570459338039, + "learning_rate": 7.09104244980288e-05, + "loss": 0.7193, + "mean_token_accuracy": 0.7829456925392151, + "num_tokens": 164975172.0, + "step": 70400 + }, + { + "epoch": 0.6455487301732832, + "learning_rate": 7.089208765013295e-05, + "loss": 0.6875, + "mean_token_accuracy": 0.7823552489280701, + "num_tokens": 164999525.0, + "step": 70410 + }, + { + "epoch": 0.6456404144127624, + "learning_rate": 7.08737508022371e-05, + "loss": 0.6499, + "mean_token_accuracy": 0.7994419276714325, + "num_tokens": 165023937.0, + "step": 70420 + }, + { + "epoch": 0.6457320986522417, + "learning_rate": 7.085541395434125e-05, + "loss": 0.6969, + "mean_token_accuracy": 0.7814277410507202, + "num_tokens": 165049014.0, + "step": 70430 + }, + { + "epoch": 0.6458237828917209, + "learning_rate": 7.08370771064454e-05, + "loss": 0.6853, + "mean_token_accuracy": 0.78925821185112, + "num_tokens": 165074552.0, + "step": 70440 + }, + { + "epoch": 0.6459154671312002, + "learning_rate": 7.081874025854955e-05, + "loss": 0.6807, + "mean_token_accuracy": 0.7904388070106506, + "num_tokens": 165100461.0, + "step": 70450 + }, + { + "epoch": 0.6460071513706794, + "learning_rate": 7.080040341065372e-05, + "loss": 0.6764, + "mean_token_accuracy": 0.7925844073295594, + "num_tokens": 165125147.0, + "step": 70460 + }, + { + "epoch": 0.6460988356101586, + "learning_rate": 7.078206656275787e-05, + "loss": 0.6826, + "mean_token_accuracy": 0.7928273975849152, + "num_tokens": 165150882.0, + "step": 70470 + }, + { + "epoch": 0.6461905198496378, + "learning_rate": 7.076372971486201e-05, + "loss": 0.709, + "mean_token_accuracy": 0.7848760843276977, + "num_tokens": 165175879.0, + "step": 70480 + }, + { + "epoch": 0.6462822040891171, + "learning_rate": 7.074539286696617e-05, + "loss": 0.683, + "mean_token_accuracy": 0.7861987471580505, + "num_tokens": 165200599.0, + "step": 70490 + }, + { + "epoch": 0.6463738883285963, + "learning_rate": 7.072705601907033e-05, + "loss": 0.6658, + "mean_token_accuracy": 0.7930368661880494, + "num_tokens": 165225446.0, + "step": 70500 + }, + { + "epoch": 0.6464655725680756, + "learning_rate": 7.070871917117448e-05, + "loss": 0.7041, + "mean_token_accuracy": 0.7830127954483033, + "num_tokens": 165250007.0, + "step": 70510 + }, + { + "epoch": 0.6465572568075548, + "learning_rate": 7.069038232327864e-05, + "loss": 0.6522, + "mean_token_accuracy": 0.8032989382743836, + "num_tokens": 165275395.0, + "step": 70520 + }, + { + "epoch": 0.646648941047034, + "learning_rate": 7.067204547538278e-05, + "loss": 0.6512, + "mean_token_accuracy": 0.7982889413833618, + "num_tokens": 165300461.0, + "step": 70530 + }, + { + "epoch": 0.6467406252865132, + "learning_rate": 7.065370862748693e-05, + "loss": 0.7155, + "mean_token_accuracy": 0.7819724440574646, + "num_tokens": 165326376.0, + "step": 70540 + }, + { + "epoch": 0.6468323095259925, + "learning_rate": 7.063537177959108e-05, + "loss": 0.66, + "mean_token_accuracy": 0.7927281200885773, + "num_tokens": 165350624.0, + "step": 70550 + }, + { + "epoch": 0.6469239937654717, + "learning_rate": 7.061703493169525e-05, + "loss": 0.724, + "mean_token_accuracy": 0.7824005544185638, + "num_tokens": 165376460.0, + "step": 70560 + }, + { + "epoch": 0.647015678004951, + "learning_rate": 7.05986980837994e-05, + "loss": 0.7089, + "mean_token_accuracy": 0.7911057472229004, + "num_tokens": 165401361.0, + "step": 70570 + }, + { + "epoch": 0.6471073622444302, + "learning_rate": 7.058036123590354e-05, + "loss": 0.6926, + "mean_token_accuracy": 0.7916284382343293, + "num_tokens": 165426545.0, + "step": 70580 + }, + { + "epoch": 0.6471990464839095, + "learning_rate": 7.05620243880077e-05, + "loss": 0.6768, + "mean_token_accuracy": 0.7930202126502991, + "num_tokens": 165452458.0, + "step": 70590 + }, + { + "epoch": 0.6472907307233886, + "learning_rate": 7.054368754011186e-05, + "loss": 0.6907, + "mean_token_accuracy": 0.7872883677482605, + "num_tokens": 165477343.0, + "step": 70600 + }, + { + "epoch": 0.6473824149628679, + "learning_rate": 7.052535069221601e-05, + "loss": 0.6591, + "mean_token_accuracy": 0.7991599798202514, + "num_tokens": 165502586.0, + "step": 70610 + }, + { + "epoch": 0.6474740992023471, + "learning_rate": 7.050701384432018e-05, + "loss": 0.6798, + "mean_token_accuracy": 0.7952367842197419, + "num_tokens": 165528173.0, + "step": 70620 + }, + { + "epoch": 0.6475657834418264, + "learning_rate": 7.048867699642431e-05, + "loss": 0.7125, + "mean_token_accuracy": 0.7836075901985169, + "num_tokens": 165553877.0, + "step": 70630 + }, + { + "epoch": 0.6476574676813056, + "learning_rate": 7.047034014852847e-05, + "loss": 0.6684, + "mean_token_accuracy": 0.7939449429512024, + "num_tokens": 165578955.0, + "step": 70640 + }, + { + "epoch": 0.6477491519207849, + "learning_rate": 7.045200330063263e-05, + "loss": 0.6966, + "mean_token_accuracy": 0.7831183791160583, + "num_tokens": 165603439.0, + "step": 70650 + }, + { + "epoch": 0.647840836160264, + "learning_rate": 7.043366645273678e-05, + "loss": 0.6888, + "mean_token_accuracy": 0.7874828219413758, + "num_tokens": 165629096.0, + "step": 70660 + }, + { + "epoch": 0.6479325203997433, + "learning_rate": 7.041532960484093e-05, + "loss": 0.6739, + "mean_token_accuracy": 0.7955126941204071, + "num_tokens": 165654003.0, + "step": 70670 + }, + { + "epoch": 0.6480242046392225, + "learning_rate": 7.039699275694507e-05, + "loss": 0.7204, + "mean_token_accuracy": 0.7809175372123718, + "num_tokens": 165679006.0, + "step": 70680 + }, + { + "epoch": 0.6481158888787018, + "learning_rate": 7.037865590904924e-05, + "loss": 0.7067, + "mean_token_accuracy": 0.7847817420959473, + "num_tokens": 165704266.0, + "step": 70690 + }, + { + "epoch": 0.648207573118181, + "learning_rate": 7.036031906115339e-05, + "loss": 0.6784, + "mean_token_accuracy": 0.7917144119739532, + "num_tokens": 165729847.0, + "step": 70700 + }, + { + "epoch": 0.6482992573576603, + "learning_rate": 7.034198221325754e-05, + "loss": 0.6837, + "mean_token_accuracy": 0.7914392411708832, + "num_tokens": 165754422.0, + "step": 70710 + }, + { + "epoch": 0.6483909415971395, + "learning_rate": 7.032364536536171e-05, + "loss": 0.6869, + "mean_token_accuracy": 0.7832569360733033, + "num_tokens": 165779794.0, + "step": 70720 + }, + { + "epoch": 0.6484826258366186, + "learning_rate": 7.030530851746585e-05, + "loss": 0.6676, + "mean_token_accuracy": 0.7912835299968719, + "num_tokens": 165804790.0, + "step": 70730 + }, + { + "epoch": 0.6485743100760979, + "learning_rate": 7.028697166957e-05, + "loss": 0.6849, + "mean_token_accuracy": 0.7877888083457947, + "num_tokens": 165830531.0, + "step": 70740 + }, + { + "epoch": 0.6486659943155771, + "learning_rate": 7.026863482167416e-05, + "loss": 0.6765, + "mean_token_accuracy": 0.7906343519687653, + "num_tokens": 165854608.0, + "step": 70750 + }, + { + "epoch": 0.6487576785550564, + "learning_rate": 7.025029797377831e-05, + "loss": 0.644, + "mean_token_accuracy": 0.799230980873108, + "num_tokens": 165879234.0, + "step": 70760 + }, + { + "epoch": 0.6488493627945356, + "learning_rate": 7.023196112588247e-05, + "loss": 0.6963, + "mean_token_accuracy": 0.7899213194847107, + "num_tokens": 165904263.0, + "step": 70770 + }, + { + "epoch": 0.6489410470340149, + "learning_rate": 7.021362427798662e-05, + "loss": 0.6655, + "mean_token_accuracy": 0.7973266541957855, + "num_tokens": 165928833.0, + "step": 70780 + }, + { + "epoch": 0.649032731273494, + "learning_rate": 7.019528743009077e-05, + "loss": 0.6969, + "mean_token_accuracy": 0.7848142504692077, + "num_tokens": 165953955.0, + "step": 70790 + }, + { + "epoch": 0.6491244155129733, + "learning_rate": 7.017695058219492e-05, + "loss": 0.6976, + "mean_token_accuracy": 0.7819412648677826, + "num_tokens": 165980016.0, + "step": 70800 + }, + { + "epoch": 0.6492160997524525, + "learning_rate": 7.015861373429907e-05, + "loss": 0.6747, + "mean_token_accuracy": 0.7877288699150086, + "num_tokens": 166004857.0, + "step": 70810 + }, + { + "epoch": 0.6493077839919318, + "learning_rate": 7.014027688640324e-05, + "loss": 0.6749, + "mean_token_accuracy": 0.7964017391204834, + "num_tokens": 166030057.0, + "step": 70820 + }, + { + "epoch": 0.649399468231411, + "learning_rate": 7.012194003850738e-05, + "loss": 0.6931, + "mean_token_accuracy": 0.7858947098255158, + "num_tokens": 166055103.0, + "step": 70830 + }, + { + "epoch": 0.6494911524708903, + "learning_rate": 7.010360319061153e-05, + "loss": 0.6935, + "mean_token_accuracy": 0.7834270834922791, + "num_tokens": 166079202.0, + "step": 70840 + }, + { + "epoch": 0.6495828367103695, + "learning_rate": 7.00852663427157e-05, + "loss": 0.6896, + "mean_token_accuracy": 0.7870459735393525, + "num_tokens": 166104363.0, + "step": 70850 + }, + { + "epoch": 0.6496745209498487, + "learning_rate": 7.006692949481985e-05, + "loss": 0.6816, + "mean_token_accuracy": 0.7928813815116882, + "num_tokens": 166129539.0, + "step": 70860 + }, + { + "epoch": 0.6497662051893279, + "learning_rate": 7.0048592646924e-05, + "loss": 0.6732, + "mean_token_accuracy": 0.7869620025157928, + "num_tokens": 166155118.0, + "step": 70870 + }, + { + "epoch": 0.6498578894288072, + "learning_rate": 7.003025579902815e-05, + "loss": 0.6416, + "mean_token_accuracy": 0.7994863152503967, + "num_tokens": 166180039.0, + "step": 70880 + }, + { + "epoch": 0.6499495736682864, + "learning_rate": 7.00119189511323e-05, + "loss": 0.7179, + "mean_token_accuracy": 0.7806203186511993, + "num_tokens": 166205355.0, + "step": 70890 + }, + { + "epoch": 0.6500412579077657, + "learning_rate": 6.999358210323645e-05, + "loss": 0.7008, + "mean_token_accuracy": 0.7929344296455383, + "num_tokens": 166230529.0, + "step": 70900 + }, + { + "epoch": 0.6501329421472449, + "learning_rate": 6.997524525534062e-05, + "loss": 0.683, + "mean_token_accuracy": 0.787913191318512, + "num_tokens": 166255023.0, + "step": 70910 + }, + { + "epoch": 0.6502246263867241, + "learning_rate": 6.995690840744477e-05, + "loss": 0.6415, + "mean_token_accuracy": 0.8023931086063385, + "num_tokens": 166279792.0, + "step": 70920 + }, + { + "epoch": 0.6503163106262033, + "learning_rate": 6.993857155954891e-05, + "loss": 0.6464, + "mean_token_accuracy": 0.799000597000122, + "num_tokens": 166304000.0, + "step": 70930 + }, + { + "epoch": 0.6504079948656826, + "learning_rate": 6.992023471165306e-05, + "loss": 0.6863, + "mean_token_accuracy": 0.7917823731899262, + "num_tokens": 166328112.0, + "step": 70940 + }, + { + "epoch": 0.6504996791051618, + "learning_rate": 6.990189786375723e-05, + "loss": 0.6656, + "mean_token_accuracy": 0.7906832039356232, + "num_tokens": 166352677.0, + "step": 70950 + }, + { + "epoch": 0.6505913633446411, + "learning_rate": 6.988356101586138e-05, + "loss": 0.6965, + "mean_token_accuracy": 0.7833178222179413, + "num_tokens": 166377524.0, + "step": 70960 + }, + { + "epoch": 0.6506830475841203, + "learning_rate": 6.986522416796553e-05, + "loss": 0.6906, + "mean_token_accuracy": 0.788356339931488, + "num_tokens": 166402176.0, + "step": 70970 + }, + { + "epoch": 0.6507747318235996, + "learning_rate": 6.984688732006968e-05, + "loss": 0.6845, + "mean_token_accuracy": 0.794219434261322, + "num_tokens": 166427401.0, + "step": 70980 + }, + { + "epoch": 0.6508664160630787, + "learning_rate": 6.982855047217383e-05, + "loss": 0.7068, + "mean_token_accuracy": 0.7824733138084412, + "num_tokens": 166452391.0, + "step": 70990 + }, + { + "epoch": 0.650958100302558, + "learning_rate": 6.981021362427799e-05, + "loss": 0.686, + "mean_token_accuracy": 0.7882467329502105, + "num_tokens": 166477223.0, + "step": 71000 + }, + { + "epoch": 0.6510497845420372, + "learning_rate": 6.979187677638215e-05, + "loss": 0.6556, + "mean_token_accuracy": 0.7950958728790283, + "num_tokens": 166503258.0, + "step": 71010 + }, + { + "epoch": 0.6511414687815165, + "learning_rate": 6.97735399284863e-05, + "loss": 0.6748, + "mean_token_accuracy": 0.792359584569931, + "num_tokens": 166528085.0, + "step": 71020 + }, + { + "epoch": 0.6512331530209957, + "learning_rate": 6.975520308059044e-05, + "loss": 0.6988, + "mean_token_accuracy": 0.7834649026393891, + "num_tokens": 166552873.0, + "step": 71030 + }, + { + "epoch": 0.651324837260475, + "learning_rate": 6.97368662326946e-05, + "loss": 0.67, + "mean_token_accuracy": 0.7926984071731568, + "num_tokens": 166579080.0, + "step": 71040 + }, + { + "epoch": 0.6514165214999541, + "learning_rate": 6.971852938479876e-05, + "loss": 0.6876, + "mean_token_accuracy": 0.7916151583194733, + "num_tokens": 166603875.0, + "step": 71050 + }, + { + "epoch": 0.6515082057394334, + "learning_rate": 6.970019253690291e-05, + "loss": 0.6593, + "mean_token_accuracy": 0.7899702608585357, + "num_tokens": 166628752.0, + "step": 71060 + }, + { + "epoch": 0.6515998899789126, + "learning_rate": 6.968185568900706e-05, + "loss": 0.6711, + "mean_token_accuracy": 0.7901023924350739, + "num_tokens": 166653770.0, + "step": 71070 + }, + { + "epoch": 0.6516915742183919, + "learning_rate": 6.966351884111122e-05, + "loss": 0.6928, + "mean_token_accuracy": 0.7889417350292206, + "num_tokens": 166678800.0, + "step": 71080 + }, + { + "epoch": 0.6517832584578711, + "learning_rate": 6.964518199321537e-05, + "loss": 0.6949, + "mean_token_accuracy": 0.7840139269828796, + "num_tokens": 166703608.0, + "step": 71090 + }, + { + "epoch": 0.6518749426973504, + "learning_rate": 6.962684514531952e-05, + "loss": 0.6768, + "mean_token_accuracy": 0.7932865202426911, + "num_tokens": 166728886.0, + "step": 71100 + }, + { + "epoch": 0.6519666269368296, + "learning_rate": 6.960850829742368e-05, + "loss": 0.6754, + "mean_token_accuracy": 0.7885345995426178, + "num_tokens": 166753171.0, + "step": 71110 + }, + { + "epoch": 0.6520583111763087, + "learning_rate": 6.959017144952784e-05, + "loss": 0.6949, + "mean_token_accuracy": 0.7940915107727051, + "num_tokens": 166778699.0, + "step": 71120 + }, + { + "epoch": 0.652149995415788, + "learning_rate": 6.957183460163197e-05, + "loss": 0.696, + "mean_token_accuracy": 0.7829701483249665, + "num_tokens": 166803107.0, + "step": 71130 + }, + { + "epoch": 0.6522416796552672, + "learning_rate": 6.955349775373614e-05, + "loss": 0.6791, + "mean_token_accuracy": 0.7943341434001923, + "num_tokens": 166828711.0, + "step": 71140 + }, + { + "epoch": 0.6523333638947465, + "learning_rate": 6.953516090584029e-05, + "loss": 0.6838, + "mean_token_accuracy": 0.7912250399589539, + "num_tokens": 166853598.0, + "step": 71150 + }, + { + "epoch": 0.6524250481342257, + "learning_rate": 6.951682405794444e-05, + "loss": 0.6956, + "mean_token_accuracy": 0.7875594735145569, + "num_tokens": 166878884.0, + "step": 71160 + }, + { + "epoch": 0.652516732373705, + "learning_rate": 6.94984872100486e-05, + "loss": 0.6711, + "mean_token_accuracy": 0.7966920077800751, + "num_tokens": 166903942.0, + "step": 71170 + }, + { + "epoch": 0.6526084166131841, + "learning_rate": 6.948015036215275e-05, + "loss": 0.6976, + "mean_token_accuracy": 0.7829735338687897, + "num_tokens": 166929442.0, + "step": 71180 + }, + { + "epoch": 0.6527001008526634, + "learning_rate": 6.94618135142569e-05, + "loss": 0.7069, + "mean_token_accuracy": 0.7873943626880646, + "num_tokens": 166955220.0, + "step": 71190 + }, + { + "epoch": 0.6527917850921426, + "learning_rate": 6.944347666636105e-05, + "loss": 0.6779, + "mean_token_accuracy": 0.7900447189807892, + "num_tokens": 166980634.0, + "step": 71200 + }, + { + "epoch": 0.6528834693316219, + "learning_rate": 6.942513981846522e-05, + "loss": 0.6741, + "mean_token_accuracy": 0.7973148584365845, + "num_tokens": 167005237.0, + "step": 71210 + }, + { + "epoch": 0.6529751535711011, + "learning_rate": 6.940680297056937e-05, + "loss": 0.7085, + "mean_token_accuracy": 0.7882147192955017, + "num_tokens": 167030239.0, + "step": 71220 + }, + { + "epoch": 0.6530668378105804, + "learning_rate": 6.93884661226735e-05, + "loss": 0.7009, + "mean_token_accuracy": 0.780734521150589, + "num_tokens": 167055419.0, + "step": 71230 + }, + { + "epoch": 0.6531585220500596, + "learning_rate": 6.937012927477767e-05, + "loss": 0.6623, + "mean_token_accuracy": 0.7908092081546784, + "num_tokens": 167080449.0, + "step": 71240 + }, + { + "epoch": 0.6532502062895388, + "learning_rate": 6.935179242688182e-05, + "loss": 0.7019, + "mean_token_accuracy": 0.7876363217830658, + "num_tokens": 167105462.0, + "step": 71250 + }, + { + "epoch": 0.653341890529018, + "learning_rate": 6.933345557898598e-05, + "loss": 0.7132, + "mean_token_accuracy": 0.7861493468284607, + "num_tokens": 167130952.0, + "step": 71260 + }, + { + "epoch": 0.6534335747684973, + "learning_rate": 6.931511873109013e-05, + "loss": 0.6802, + "mean_token_accuracy": 0.7848678529262543, + "num_tokens": 167156303.0, + "step": 71270 + }, + { + "epoch": 0.6535252590079765, + "learning_rate": 6.929678188319428e-05, + "loss": 0.6602, + "mean_token_accuracy": 0.7955906808376312, + "num_tokens": 167182702.0, + "step": 71280 + }, + { + "epoch": 0.6536169432474558, + "learning_rate": 6.927844503529843e-05, + "loss": 0.6819, + "mean_token_accuracy": 0.794136357307434, + "num_tokens": 167207799.0, + "step": 71290 + }, + { + "epoch": 0.653708627486935, + "learning_rate": 6.926010818740258e-05, + "loss": 0.7208, + "mean_token_accuracy": 0.7786969423294068, + "num_tokens": 167233324.0, + "step": 71300 + }, + { + "epoch": 0.6538003117264142, + "learning_rate": 6.924177133950675e-05, + "loss": 0.726, + "mean_token_accuracy": 0.7827441334724426, + "num_tokens": 167258748.0, + "step": 71310 + }, + { + "epoch": 0.6538919959658934, + "learning_rate": 6.92234344916109e-05, + "loss": 0.6867, + "mean_token_accuracy": 0.7898482620716095, + "num_tokens": 167284325.0, + "step": 71320 + }, + { + "epoch": 0.6539836802053727, + "learning_rate": 6.920509764371504e-05, + "loss": 0.6657, + "mean_token_accuracy": 0.7865634679794311, + "num_tokens": 167310076.0, + "step": 71330 + }, + { + "epoch": 0.6540753644448519, + "learning_rate": 6.91867607958192e-05, + "loss": 0.6725, + "mean_token_accuracy": 0.7915717363357544, + "num_tokens": 167334811.0, + "step": 71340 + }, + { + "epoch": 0.6541670486843312, + "learning_rate": 6.916842394792336e-05, + "loss": 0.6903, + "mean_token_accuracy": 0.7892451882362366, + "num_tokens": 167359807.0, + "step": 71350 + }, + { + "epoch": 0.6542587329238104, + "learning_rate": 6.915008710002751e-05, + "loss": 0.6944, + "mean_token_accuracy": 0.7852569878101349, + "num_tokens": 167385181.0, + "step": 71360 + }, + { + "epoch": 0.6543504171632897, + "learning_rate": 6.913175025213166e-05, + "loss": 0.6771, + "mean_token_accuracy": 0.7882788836956024, + "num_tokens": 167410414.0, + "step": 71370 + }, + { + "epoch": 0.6544421014027688, + "learning_rate": 6.911341340423581e-05, + "loss": 0.6762, + "mean_token_accuracy": 0.7888165235519409, + "num_tokens": 167435843.0, + "step": 71380 + }, + { + "epoch": 0.6545337856422481, + "learning_rate": 6.909507655633996e-05, + "loss": 0.6847, + "mean_token_accuracy": 0.7893908262252808, + "num_tokens": 167461325.0, + "step": 71390 + }, + { + "epoch": 0.6546254698817273, + "learning_rate": 6.907673970844413e-05, + "loss": 0.6957, + "mean_token_accuracy": 0.7918611347675324, + "num_tokens": 167485926.0, + "step": 71400 + }, + { + "epoch": 0.6547171541212066, + "learning_rate": 6.905840286054828e-05, + "loss": 0.6446, + "mean_token_accuracy": 0.7933196544647216, + "num_tokens": 167511660.0, + "step": 71410 + }, + { + "epoch": 0.6548088383606858, + "learning_rate": 6.904006601265243e-05, + "loss": 0.7014, + "mean_token_accuracy": 0.7869983971118927, + "num_tokens": 167536907.0, + "step": 71420 + }, + { + "epoch": 0.6549005226001651, + "learning_rate": 6.902172916475657e-05, + "loss": 0.7259, + "mean_token_accuracy": 0.7848357141017914, + "num_tokens": 167562140.0, + "step": 71430 + }, + { + "epoch": 0.6549922068396443, + "learning_rate": 6.900339231686074e-05, + "loss": 0.6888, + "mean_token_accuracy": 0.7915430128574371, + "num_tokens": 167586248.0, + "step": 71440 + }, + { + "epoch": 0.6550838910791235, + "learning_rate": 6.898505546896489e-05, + "loss": 0.7193, + "mean_token_accuracy": 0.7776082277297973, + "num_tokens": 167611633.0, + "step": 71450 + }, + { + "epoch": 0.6551755753186027, + "learning_rate": 6.896671862106904e-05, + "loss": 0.7026, + "mean_token_accuracy": 0.783545869588852, + "num_tokens": 167636728.0, + "step": 71460 + }, + { + "epoch": 0.655267259558082, + "learning_rate": 6.894838177317319e-05, + "loss": 0.7239, + "mean_token_accuracy": 0.7785880982875824, + "num_tokens": 167661386.0, + "step": 71470 + }, + { + "epoch": 0.6553589437975612, + "learning_rate": 6.893004492527734e-05, + "loss": 0.6606, + "mean_token_accuracy": 0.7987613320350647, + "num_tokens": 167685801.0, + "step": 71480 + }, + { + "epoch": 0.6554506280370405, + "learning_rate": 6.89117080773815e-05, + "loss": 0.6685, + "mean_token_accuracy": 0.792380154132843, + "num_tokens": 167711078.0, + "step": 71490 + }, + { + "epoch": 0.6555423122765197, + "learning_rate": 6.889337122948566e-05, + "loss": 0.6511, + "mean_token_accuracy": 0.7922020494937897, + "num_tokens": 167736759.0, + "step": 71500 + }, + { + "epoch": 0.6556339965159989, + "learning_rate": 6.887503438158981e-05, + "loss": 0.6847, + "mean_token_accuracy": 0.7862393975257873, + "num_tokens": 167761993.0, + "step": 71510 + }, + { + "epoch": 0.6557256807554781, + "learning_rate": 6.885669753369397e-05, + "loss": 0.6569, + "mean_token_accuracy": 0.792601364850998, + "num_tokens": 167786582.0, + "step": 71520 + }, + { + "epoch": 0.6558173649949574, + "learning_rate": 6.883836068579812e-05, + "loss": 0.6876, + "mean_token_accuracy": 0.7875175237655639, + "num_tokens": 167811083.0, + "step": 71530 + }, + { + "epoch": 0.6559090492344366, + "learning_rate": 6.882002383790227e-05, + "loss": 0.672, + "mean_token_accuracy": 0.7888307452201844, + "num_tokens": 167836253.0, + "step": 71540 + }, + { + "epoch": 0.6560007334739159, + "learning_rate": 6.880168699000642e-05, + "loss": 0.6806, + "mean_token_accuracy": 0.790232104063034, + "num_tokens": 167860168.0, + "step": 71550 + }, + { + "epoch": 0.6560924177133951, + "learning_rate": 6.878335014211057e-05, + "loss": 0.7129, + "mean_token_accuracy": 0.7792242765426636, + "num_tokens": 167885750.0, + "step": 71560 + }, + { + "epoch": 0.6561841019528744, + "learning_rate": 6.876501329421472e-05, + "loss": 0.6676, + "mean_token_accuracy": 0.7946697473526001, + "num_tokens": 167911467.0, + "step": 71570 + }, + { + "epoch": 0.6562757861923535, + "learning_rate": 6.874667644631888e-05, + "loss": 0.6715, + "mean_token_accuracy": 0.7902608871459961, + "num_tokens": 167936193.0, + "step": 71580 + }, + { + "epoch": 0.6563674704318327, + "learning_rate": 6.872833959842303e-05, + "loss": 0.6759, + "mean_token_accuracy": 0.792341285943985, + "num_tokens": 167960758.0, + "step": 71590 + }, + { + "epoch": 0.656459154671312, + "learning_rate": 6.87100027505272e-05, + "loss": 0.685, + "mean_token_accuracy": 0.783710652589798, + "num_tokens": 167985686.0, + "step": 71600 + }, + { + "epoch": 0.6565508389107912, + "learning_rate": 6.869166590263135e-05, + "loss": 0.692, + "mean_token_accuracy": 0.8000739336013794, + "num_tokens": 168010472.0, + "step": 71610 + }, + { + "epoch": 0.6566425231502705, + "learning_rate": 6.86733290547355e-05, + "loss": 0.7105, + "mean_token_accuracy": 0.7812987685203552, + "num_tokens": 168035933.0, + "step": 71620 + }, + { + "epoch": 0.6567342073897497, + "learning_rate": 6.865499220683965e-05, + "loss": 0.6906, + "mean_token_accuracy": 0.7924662590026855, + "num_tokens": 168061104.0, + "step": 71630 + }, + { + "epoch": 0.6568258916292289, + "learning_rate": 6.86366553589438e-05, + "loss": 0.6977, + "mean_token_accuracy": 0.7867888748645783, + "num_tokens": 168086657.0, + "step": 71640 + }, + { + "epoch": 0.6569175758687081, + "learning_rate": 6.861831851104795e-05, + "loss": 0.6968, + "mean_token_accuracy": 0.7839610815048218, + "num_tokens": 168112276.0, + "step": 71650 + }, + { + "epoch": 0.6570092601081874, + "learning_rate": 6.85999816631521e-05, + "loss": 0.6925, + "mean_token_accuracy": 0.7872973442077636, + "num_tokens": 168137487.0, + "step": 71660 + }, + { + "epoch": 0.6571009443476666, + "learning_rate": 6.858164481525626e-05, + "loss": 0.6996, + "mean_token_accuracy": 0.7813877284526825, + "num_tokens": 168162714.0, + "step": 71670 + }, + { + "epoch": 0.6571926285871459, + "learning_rate": 6.856330796736041e-05, + "loss": 0.6939, + "mean_token_accuracy": 0.7868259906768799, + "num_tokens": 168186991.0, + "step": 71680 + }, + { + "epoch": 0.6572843128266251, + "learning_rate": 6.854497111946456e-05, + "loss": 0.7375, + "mean_token_accuracy": 0.779875522851944, + "num_tokens": 168212366.0, + "step": 71690 + }, + { + "epoch": 0.6573759970661044, + "learning_rate": 6.852663427156873e-05, + "loss": 0.6823, + "mean_token_accuracy": 0.785092294216156, + "num_tokens": 168237763.0, + "step": 71700 + }, + { + "epoch": 0.6574676813055835, + "learning_rate": 6.850829742367288e-05, + "loss": 0.6756, + "mean_token_accuracy": 0.7955116391181946, + "num_tokens": 168262788.0, + "step": 71710 + }, + { + "epoch": 0.6575593655450628, + "learning_rate": 6.848996057577703e-05, + "loss": 0.656, + "mean_token_accuracy": 0.7953277707099915, + "num_tokens": 168287893.0, + "step": 71720 + }, + { + "epoch": 0.657651049784542, + "learning_rate": 6.847162372788118e-05, + "loss": 0.6541, + "mean_token_accuracy": 0.8006919801235199, + "num_tokens": 168313793.0, + "step": 71730 + }, + { + "epoch": 0.6577427340240213, + "learning_rate": 6.845328687998533e-05, + "loss": 0.6694, + "mean_token_accuracy": 0.7931058228015899, + "num_tokens": 168339033.0, + "step": 71740 + }, + { + "epoch": 0.6578344182635005, + "learning_rate": 6.843495003208949e-05, + "loss": 0.6912, + "mean_token_accuracy": 0.7899622797966004, + "num_tokens": 168363352.0, + "step": 71750 + }, + { + "epoch": 0.6579261025029798, + "learning_rate": 6.841661318419365e-05, + "loss": 0.7138, + "mean_token_accuracy": 0.7756168782711029, + "num_tokens": 168389113.0, + "step": 71760 + }, + { + "epoch": 0.6580177867424589, + "learning_rate": 6.839827633629779e-05, + "loss": 0.6981, + "mean_token_accuracy": 0.7802573800086975, + "num_tokens": 168414002.0, + "step": 71770 + }, + { + "epoch": 0.6581094709819382, + "learning_rate": 6.837993948840194e-05, + "loss": 0.6902, + "mean_token_accuracy": 0.78469517827034, + "num_tokens": 168439569.0, + "step": 71780 + }, + { + "epoch": 0.6582011552214174, + "learning_rate": 6.836160264050609e-05, + "loss": 0.6874, + "mean_token_accuracy": 0.7881043136119843, + "num_tokens": 168464214.0, + "step": 71790 + }, + { + "epoch": 0.6582928394608967, + "learning_rate": 6.834326579261026e-05, + "loss": 0.7062, + "mean_token_accuracy": 0.7843380331993103, + "num_tokens": 168489506.0, + "step": 71800 + }, + { + "epoch": 0.6583845237003759, + "learning_rate": 6.832492894471441e-05, + "loss": 0.6582, + "mean_token_accuracy": 0.7941269040107727, + "num_tokens": 168514524.0, + "step": 71810 + }, + { + "epoch": 0.6584762079398552, + "learning_rate": 6.830659209681856e-05, + "loss": 0.6647, + "mean_token_accuracy": 0.7903441488742828, + "num_tokens": 168539982.0, + "step": 71820 + }, + { + "epoch": 0.6585678921793344, + "learning_rate": 6.828825524892271e-05, + "loss": 0.7085, + "mean_token_accuracy": 0.778989827632904, + "num_tokens": 168564877.0, + "step": 71830 + }, + { + "epoch": 0.6586595764188136, + "learning_rate": 6.826991840102687e-05, + "loss": 0.6232, + "mean_token_accuracy": 0.8072134256362915, + "num_tokens": 168588968.0, + "step": 71840 + }, + { + "epoch": 0.6587512606582928, + "learning_rate": 6.825158155313102e-05, + "loss": 0.6653, + "mean_token_accuracy": 0.7958389580249786, + "num_tokens": 168613877.0, + "step": 71850 + }, + { + "epoch": 0.6588429448977721, + "learning_rate": 6.823324470523518e-05, + "loss": 0.6722, + "mean_token_accuracy": 0.7907417356967926, + "num_tokens": 168638901.0, + "step": 71860 + }, + { + "epoch": 0.6589346291372513, + "learning_rate": 6.821490785733932e-05, + "loss": 0.7133, + "mean_token_accuracy": 0.7794717311859131, + "num_tokens": 168663687.0, + "step": 71870 + }, + { + "epoch": 0.6590263133767306, + "learning_rate": 6.819657100944347e-05, + "loss": 0.6796, + "mean_token_accuracy": 0.7891310036182404, + "num_tokens": 168688512.0, + "step": 71880 + }, + { + "epoch": 0.6591179976162098, + "learning_rate": 6.817823416154764e-05, + "loss": 0.733, + "mean_token_accuracy": 0.7727105498313904, + "num_tokens": 168713530.0, + "step": 71890 + }, + { + "epoch": 0.659209681855689, + "learning_rate": 6.815989731365179e-05, + "loss": 0.6781, + "mean_token_accuracy": 0.7864547491073608, + "num_tokens": 168738377.0, + "step": 71900 + }, + { + "epoch": 0.6593013660951682, + "learning_rate": 6.814156046575594e-05, + "loss": 0.6815, + "mean_token_accuracy": 0.7860010683536529, + "num_tokens": 168762927.0, + "step": 71910 + }, + { + "epoch": 0.6593930503346475, + "learning_rate": 6.81232236178601e-05, + "loss": 0.6738, + "mean_token_accuracy": 0.7960246980190278, + "num_tokens": 168787599.0, + "step": 71920 + }, + { + "epoch": 0.6594847345741267, + "learning_rate": 6.810488676996425e-05, + "loss": 0.7147, + "mean_token_accuracy": 0.783091139793396, + "num_tokens": 168811616.0, + "step": 71930 + }, + { + "epoch": 0.659576418813606, + "learning_rate": 6.80865499220684e-05, + "loss": 0.6475, + "mean_token_accuracy": 0.798850291967392, + "num_tokens": 168836155.0, + "step": 71940 + }, + { + "epoch": 0.6596681030530852, + "learning_rate": 6.806821307417255e-05, + "loss": 0.694, + "mean_token_accuracy": 0.7888308942317963, + "num_tokens": 168861533.0, + "step": 71950 + }, + { + "epoch": 0.6597597872925645, + "learning_rate": 6.804987622627672e-05, + "loss": 0.6861, + "mean_token_accuracy": 0.7865898370742798, + "num_tokens": 168887033.0, + "step": 71960 + }, + { + "epoch": 0.6598514715320436, + "learning_rate": 6.803153937838085e-05, + "loss": 0.6806, + "mean_token_accuracy": 0.790938937664032, + "num_tokens": 168912425.0, + "step": 71970 + }, + { + "epoch": 0.6599431557715228, + "learning_rate": 6.8013202530485e-05, + "loss": 0.673, + "mean_token_accuracy": 0.7866240203380584, + "num_tokens": 168937504.0, + "step": 71980 + }, + { + "epoch": 0.6600348400110021, + "learning_rate": 6.799486568258917e-05, + "loss": 0.6705, + "mean_token_accuracy": 0.7928176879882812, + "num_tokens": 168962648.0, + "step": 71990 + }, + { + "epoch": 0.6601265242504814, + "learning_rate": 6.797652883469332e-05, + "loss": 0.6746, + "mean_token_accuracy": 0.790187019109726, + "num_tokens": 168987769.0, + "step": 72000 + }, + { + "epoch": 0.6602182084899606, + "learning_rate": 6.795819198679747e-05, + "loss": 0.6992, + "mean_token_accuracy": 0.786000233888626, + "num_tokens": 169012666.0, + "step": 72010 + }, + { + "epoch": 0.6603098927294399, + "learning_rate": 6.793985513890163e-05, + "loss": 0.6732, + "mean_token_accuracy": 0.7908929944038391, + "num_tokens": 169038237.0, + "step": 72020 + }, + { + "epoch": 0.660401576968919, + "learning_rate": 6.792151829100578e-05, + "loss": 0.6584, + "mean_token_accuracy": 0.7980163812637329, + "num_tokens": 169064039.0, + "step": 72030 + }, + { + "epoch": 0.6604932612083982, + "learning_rate": 6.790318144310993e-05, + "loss": 0.671, + "mean_token_accuracy": 0.7938000857830048, + "num_tokens": 169088470.0, + "step": 72040 + }, + { + "epoch": 0.6605849454478775, + "learning_rate": 6.788484459521408e-05, + "loss": 0.6717, + "mean_token_accuracy": 0.7914857923984527, + "num_tokens": 169114372.0, + "step": 72050 + }, + { + "epoch": 0.6606766296873567, + "learning_rate": 6.786650774731825e-05, + "loss": 0.6677, + "mean_token_accuracy": 0.7910528302192688, + "num_tokens": 169139429.0, + "step": 72060 + }, + { + "epoch": 0.660768313926836, + "learning_rate": 6.784817089942239e-05, + "loss": 0.7079, + "mean_token_accuracy": 0.7883346676826477, + "num_tokens": 169164013.0, + "step": 72070 + }, + { + "epoch": 0.6608599981663152, + "learning_rate": 6.782983405152654e-05, + "loss": 0.6556, + "mean_token_accuracy": 0.7989653050899506, + "num_tokens": 169188963.0, + "step": 72080 + }, + { + "epoch": 0.6609516824057945, + "learning_rate": 6.78114972036307e-05, + "loss": 0.735, + "mean_token_accuracy": 0.7789423286914825, + "num_tokens": 169214278.0, + "step": 72090 + }, + { + "epoch": 0.6610433666452736, + "learning_rate": 6.779316035573485e-05, + "loss": 0.6858, + "mean_token_accuracy": 0.7885903954505921, + "num_tokens": 169238598.0, + "step": 72100 + }, + { + "epoch": 0.6611350508847529, + "learning_rate": 6.7774823507839e-05, + "loss": 0.6708, + "mean_token_accuracy": 0.7963763773441315, + "num_tokens": 169263385.0, + "step": 72110 + }, + { + "epoch": 0.6612267351242321, + "learning_rate": 6.775648665994316e-05, + "loss": 0.6832, + "mean_token_accuracy": 0.7952436149120331, + "num_tokens": 169288176.0, + "step": 72120 + }, + { + "epoch": 0.6613184193637114, + "learning_rate": 6.773814981204731e-05, + "loss": 0.6525, + "mean_token_accuracy": 0.7992342174053192, + "num_tokens": 169313511.0, + "step": 72130 + }, + { + "epoch": 0.6614101036031906, + "learning_rate": 6.771981296415146e-05, + "loss": 0.6424, + "mean_token_accuracy": 0.8027814626693726, + "num_tokens": 169338622.0, + "step": 72140 + }, + { + "epoch": 0.6615017878426699, + "learning_rate": 6.770147611625563e-05, + "loss": 0.7212, + "mean_token_accuracy": 0.7763095557689667, + "num_tokens": 169364650.0, + "step": 72150 + }, + { + "epoch": 0.661593472082149, + "learning_rate": 6.768313926835978e-05, + "loss": 0.6764, + "mean_token_accuracy": 0.7919943451881408, + "num_tokens": 169390729.0, + "step": 72160 + }, + { + "epoch": 0.6616851563216283, + "learning_rate": 6.766480242046392e-05, + "loss": 0.7052, + "mean_token_accuracy": 0.782336163520813, + "num_tokens": 169415761.0, + "step": 72170 + }, + { + "epoch": 0.6617768405611075, + "learning_rate": 6.764646557256807e-05, + "loss": 0.6943, + "mean_token_accuracy": 0.7865187466144562, + "num_tokens": 169441300.0, + "step": 72180 + }, + { + "epoch": 0.6618685248005868, + "learning_rate": 6.762812872467224e-05, + "loss": 0.6811, + "mean_token_accuracy": 0.7896221995353698, + "num_tokens": 169466401.0, + "step": 72190 + }, + { + "epoch": 0.661960209040066, + "learning_rate": 6.760979187677639e-05, + "loss": 0.6797, + "mean_token_accuracy": 0.7934462070465088, + "num_tokens": 169490490.0, + "step": 72200 + }, + { + "epoch": 0.6620518932795453, + "learning_rate": 6.759145502888054e-05, + "loss": 0.6536, + "mean_token_accuracy": 0.7974579572677613, + "num_tokens": 169515795.0, + "step": 72210 + }, + { + "epoch": 0.6621435775190245, + "learning_rate": 6.757311818098469e-05, + "loss": 0.6828, + "mean_token_accuracy": 0.7918470799922943, + "num_tokens": 169541617.0, + "step": 72220 + }, + { + "epoch": 0.6622352617585037, + "learning_rate": 6.755478133308884e-05, + "loss": 0.6789, + "mean_token_accuracy": 0.79769948720932, + "num_tokens": 169566238.0, + "step": 72230 + }, + { + "epoch": 0.6623269459979829, + "learning_rate": 6.7536444485193e-05, + "loss": 0.6874, + "mean_token_accuracy": 0.7852485775947571, + "num_tokens": 169590963.0, + "step": 72240 + }, + { + "epoch": 0.6624186302374622, + "learning_rate": 6.751810763729716e-05, + "loss": 0.6587, + "mean_token_accuracy": 0.7933691024780274, + "num_tokens": 169615570.0, + "step": 72250 + }, + { + "epoch": 0.6625103144769414, + "learning_rate": 6.749977078940131e-05, + "loss": 0.6882, + "mean_token_accuracy": 0.7925223767757416, + "num_tokens": 169641329.0, + "step": 72260 + }, + { + "epoch": 0.6626019987164207, + "learning_rate": 6.748143394150545e-05, + "loss": 0.6557, + "mean_token_accuracy": 0.7946510136127471, + "num_tokens": 169666528.0, + "step": 72270 + }, + { + "epoch": 0.6626936829558999, + "learning_rate": 6.74630970936096e-05, + "loss": 0.7183, + "mean_token_accuracy": 0.7837998986244201, + "num_tokens": 169691669.0, + "step": 72280 + }, + { + "epoch": 0.6627853671953791, + "learning_rate": 6.744476024571377e-05, + "loss": 0.6883, + "mean_token_accuracy": 0.7890930533409118, + "num_tokens": 169716903.0, + "step": 72290 + }, + { + "epoch": 0.6628770514348583, + "learning_rate": 6.742642339781792e-05, + "loss": 0.7106, + "mean_token_accuracy": 0.782125735282898, + "num_tokens": 169741843.0, + "step": 72300 + }, + { + "epoch": 0.6629687356743376, + "learning_rate": 6.740808654992207e-05, + "loss": 0.6576, + "mean_token_accuracy": 0.7944453895092011, + "num_tokens": 169766789.0, + "step": 72310 + }, + { + "epoch": 0.6630604199138168, + "learning_rate": 6.738974970202622e-05, + "loss": 0.6641, + "mean_token_accuracy": 0.7893314301967621, + "num_tokens": 169792335.0, + "step": 72320 + }, + { + "epoch": 0.6631521041532961, + "learning_rate": 6.737141285413037e-05, + "loss": 0.6825, + "mean_token_accuracy": 0.7878741383552551, + "num_tokens": 169816737.0, + "step": 72330 + }, + { + "epoch": 0.6632437883927753, + "learning_rate": 6.735307600623453e-05, + "loss": 0.6768, + "mean_token_accuracy": 0.7936313450336456, + "num_tokens": 169841544.0, + "step": 72340 + }, + { + "epoch": 0.6633354726322546, + "learning_rate": 6.733473915833869e-05, + "loss": 0.6719, + "mean_token_accuracy": 0.7930039465427399, + "num_tokens": 169866904.0, + "step": 72350 + }, + { + "epoch": 0.6634271568717337, + "learning_rate": 6.731640231044284e-05, + "loss": 0.6814, + "mean_token_accuracy": 0.780381029844284, + "num_tokens": 169891983.0, + "step": 72360 + }, + { + "epoch": 0.663518841111213, + "learning_rate": 6.729806546254698e-05, + "loss": 0.7025, + "mean_token_accuracy": 0.7849653840065003, + "num_tokens": 169916888.0, + "step": 72370 + }, + { + "epoch": 0.6636105253506922, + "learning_rate": 6.727972861465115e-05, + "loss": 0.671, + "mean_token_accuracy": 0.7922280192375183, + "num_tokens": 169942786.0, + "step": 72380 + }, + { + "epoch": 0.6637022095901715, + "learning_rate": 6.72613917667553e-05, + "loss": 0.6817, + "mean_token_accuracy": 0.7830262303352356, + "num_tokens": 169967689.0, + "step": 72390 + }, + { + "epoch": 0.6637938938296507, + "learning_rate": 6.724305491885945e-05, + "loss": 0.7013, + "mean_token_accuracy": 0.7871264457702637, + "num_tokens": 169992642.0, + "step": 72400 + }, + { + "epoch": 0.66388557806913, + "learning_rate": 6.72247180709636e-05, + "loss": 0.6718, + "mean_token_accuracy": 0.7969866991043091, + "num_tokens": 170018387.0, + "step": 72410 + }, + { + "epoch": 0.6639772623086091, + "learning_rate": 6.720638122306776e-05, + "loss": 0.6928, + "mean_token_accuracy": 0.786678147315979, + "num_tokens": 170043542.0, + "step": 72420 + }, + { + "epoch": 0.6640689465480883, + "learning_rate": 6.718804437517191e-05, + "loss": 0.684, + "mean_token_accuracy": 0.7954052209854126, + "num_tokens": 170069024.0, + "step": 72430 + }, + { + "epoch": 0.6641606307875676, + "learning_rate": 6.716970752727606e-05, + "loss": 0.7049, + "mean_token_accuracy": 0.7860666513442993, + "num_tokens": 170094224.0, + "step": 72440 + }, + { + "epoch": 0.6642523150270468, + "learning_rate": 6.715137067938022e-05, + "loss": 0.6566, + "mean_token_accuracy": 0.7930137574672699, + "num_tokens": 170119561.0, + "step": 72450 + }, + { + "epoch": 0.6643439992665261, + "learning_rate": 6.713303383148438e-05, + "loss": 0.6375, + "mean_token_accuracy": 0.8034508168697357, + "num_tokens": 170144527.0, + "step": 72460 + }, + { + "epoch": 0.6644356835060053, + "learning_rate": 6.711469698358851e-05, + "loss": 0.6943, + "mean_token_accuracy": 0.7905678987503052, + "num_tokens": 170169450.0, + "step": 72470 + }, + { + "epoch": 0.6645273677454846, + "learning_rate": 6.709636013569268e-05, + "loss": 0.6599, + "mean_token_accuracy": 0.7895504474639893, + "num_tokens": 170194966.0, + "step": 72480 + }, + { + "epoch": 0.6646190519849637, + "learning_rate": 6.707802328779683e-05, + "loss": 0.6562, + "mean_token_accuracy": 0.7965170204639435, + "num_tokens": 170220289.0, + "step": 72490 + }, + { + "epoch": 0.664710736224443, + "learning_rate": 6.705968643990098e-05, + "loss": 0.6629, + "mean_token_accuracy": 0.7979708194732666, + "num_tokens": 170245545.0, + "step": 72500 + }, + { + "epoch": 0.6648024204639222, + "learning_rate": 6.704134959200515e-05, + "loss": 0.68, + "mean_token_accuracy": 0.7887271881103516, + "num_tokens": 170270007.0, + "step": 72510 + }, + { + "epoch": 0.6648941047034015, + "learning_rate": 6.702301274410929e-05, + "loss": 0.6495, + "mean_token_accuracy": 0.793360835313797, + "num_tokens": 170294936.0, + "step": 72520 + }, + { + "epoch": 0.6649857889428807, + "learning_rate": 6.700467589621344e-05, + "loss": 0.6705, + "mean_token_accuracy": 0.7929691433906555, + "num_tokens": 170320028.0, + "step": 72530 + }, + { + "epoch": 0.66507747318236, + "learning_rate": 6.698633904831759e-05, + "loss": 0.6714, + "mean_token_accuracy": 0.7888080418109894, + "num_tokens": 170344859.0, + "step": 72540 + }, + { + "epoch": 0.6651691574218392, + "learning_rate": 6.696800220042176e-05, + "loss": 0.695, + "mean_token_accuracy": 0.7836909532546997, + "num_tokens": 170369640.0, + "step": 72550 + }, + { + "epoch": 0.6652608416613184, + "learning_rate": 6.694966535252591e-05, + "loss": 0.6606, + "mean_token_accuracy": 0.7975388288497924, + "num_tokens": 170394568.0, + "step": 72560 + }, + { + "epoch": 0.6653525259007976, + "learning_rate": 6.693132850463005e-05, + "loss": 0.707, + "mean_token_accuracy": 0.7804718494415284, + "num_tokens": 170419414.0, + "step": 72570 + }, + { + "epoch": 0.6654442101402769, + "learning_rate": 6.691299165673421e-05, + "loss": 0.6756, + "mean_token_accuracy": 0.7886490046977996, + "num_tokens": 170444401.0, + "step": 72580 + }, + { + "epoch": 0.6655358943797561, + "learning_rate": 6.689465480883836e-05, + "loss": 0.7255, + "mean_token_accuracy": 0.7776539385318756, + "num_tokens": 170469876.0, + "step": 72590 + }, + { + "epoch": 0.6656275786192354, + "learning_rate": 6.687631796094252e-05, + "loss": 0.6542, + "mean_token_accuracy": 0.7902257859706878, + "num_tokens": 170493939.0, + "step": 72600 + }, + { + "epoch": 0.6657192628587146, + "learning_rate": 6.685798111304668e-05, + "loss": 0.6736, + "mean_token_accuracy": 0.7904944241046905, + "num_tokens": 170518678.0, + "step": 72610 + }, + { + "epoch": 0.6658109470981938, + "learning_rate": 6.683964426515082e-05, + "loss": 0.6942, + "mean_token_accuracy": 0.7855430006980896, + "num_tokens": 170544146.0, + "step": 72620 + }, + { + "epoch": 0.665902631337673, + "learning_rate": 6.682130741725497e-05, + "loss": 0.702, + "mean_token_accuracy": 0.784555172920227, + "num_tokens": 170569430.0, + "step": 72630 + }, + { + "epoch": 0.6659943155771523, + "learning_rate": 6.680297056935914e-05, + "loss": 0.6786, + "mean_token_accuracy": 0.7891363143920899, + "num_tokens": 170594523.0, + "step": 72640 + }, + { + "epoch": 0.6660859998166315, + "learning_rate": 6.678463372146329e-05, + "loss": 0.6533, + "mean_token_accuracy": 0.7904845714569092, + "num_tokens": 170619528.0, + "step": 72650 + }, + { + "epoch": 0.6661776840561108, + "learning_rate": 6.676629687356744e-05, + "loss": 0.6692, + "mean_token_accuracy": 0.7959149599075317, + "num_tokens": 170643898.0, + "step": 72660 + }, + { + "epoch": 0.66626936829559, + "learning_rate": 6.674796002567158e-05, + "loss": 0.6944, + "mean_token_accuracy": 0.7878892064094544, + "num_tokens": 170669116.0, + "step": 72670 + }, + { + "epoch": 0.6663610525350693, + "learning_rate": 6.672962317777574e-05, + "loss": 0.6694, + "mean_token_accuracy": 0.783225154876709, + "num_tokens": 170694052.0, + "step": 72680 + }, + { + "epoch": 0.6664527367745484, + "learning_rate": 6.67112863298799e-05, + "loss": 0.6842, + "mean_token_accuracy": 0.7891632854938507, + "num_tokens": 170719295.0, + "step": 72690 + }, + { + "epoch": 0.6665444210140277, + "learning_rate": 6.669294948198405e-05, + "loss": 0.6794, + "mean_token_accuracy": 0.7890183508396149, + "num_tokens": 170743973.0, + "step": 72700 + }, + { + "epoch": 0.6666361052535069, + "learning_rate": 6.667461263408821e-05, + "loss": 0.6688, + "mean_token_accuracy": 0.7928049027919769, + "num_tokens": 170770263.0, + "step": 72710 + }, + { + "epoch": 0.6667277894929862, + "learning_rate": 6.665627578619235e-05, + "loss": 0.6981, + "mean_token_accuracy": 0.7866098165512085, + "num_tokens": 170795734.0, + "step": 72720 + }, + { + "epoch": 0.6668194737324654, + "learning_rate": 6.66379389382965e-05, + "loss": 0.6872, + "mean_token_accuracy": 0.7820593237876892, + "num_tokens": 170821340.0, + "step": 72730 + }, + { + "epoch": 0.6669111579719447, + "learning_rate": 6.661960209040067e-05, + "loss": 0.6711, + "mean_token_accuracy": 0.7926416516304016, + "num_tokens": 170846356.0, + "step": 72740 + }, + { + "epoch": 0.6670028422114238, + "learning_rate": 6.660126524250482e-05, + "loss": 0.6996, + "mean_token_accuracy": 0.7878145575523376, + "num_tokens": 170872345.0, + "step": 72750 + }, + { + "epoch": 0.6670945264509031, + "learning_rate": 6.658292839460897e-05, + "loss": 0.7001, + "mean_token_accuracy": 0.7886099994182587, + "num_tokens": 170897693.0, + "step": 72760 + }, + { + "epoch": 0.6671862106903823, + "learning_rate": 6.656459154671312e-05, + "loss": 0.6685, + "mean_token_accuracy": 0.7847908437252045, + "num_tokens": 170922159.0, + "step": 72770 + }, + { + "epoch": 0.6672778949298616, + "learning_rate": 6.654625469881728e-05, + "loss": 0.6428, + "mean_token_accuracy": 0.8001977264881134, + "num_tokens": 170947580.0, + "step": 72780 + }, + { + "epoch": 0.6673695791693408, + "learning_rate": 6.652791785092143e-05, + "loss": 0.6993, + "mean_token_accuracy": 0.782284551858902, + "num_tokens": 170972474.0, + "step": 72790 + }, + { + "epoch": 0.6674612634088201, + "learning_rate": 6.650958100302558e-05, + "loss": 0.6919, + "mean_token_accuracy": 0.7873977839946746, + "num_tokens": 170997899.0, + "step": 72800 + }, + { + "epoch": 0.6675529476482993, + "learning_rate": 6.649124415512975e-05, + "loss": 0.6935, + "mean_token_accuracy": 0.7870490491390228, + "num_tokens": 171023387.0, + "step": 72810 + }, + { + "epoch": 0.6676446318877785, + "learning_rate": 6.647290730723388e-05, + "loss": 0.6304, + "mean_token_accuracy": 0.7952752888202668, + "num_tokens": 171048621.0, + "step": 72820 + }, + { + "epoch": 0.6677363161272577, + "learning_rate": 6.645457045933804e-05, + "loss": 0.7084, + "mean_token_accuracy": 0.7862338602542878, + "num_tokens": 171073649.0, + "step": 72830 + }, + { + "epoch": 0.667828000366737, + "learning_rate": 6.64362336114422e-05, + "loss": 0.7063, + "mean_token_accuracy": 0.7843965888023376, + "num_tokens": 171098166.0, + "step": 72840 + }, + { + "epoch": 0.6679196846062162, + "learning_rate": 6.641789676354635e-05, + "loss": 0.6897, + "mean_token_accuracy": 0.78678657412529, + "num_tokens": 171123799.0, + "step": 72850 + }, + { + "epoch": 0.6680113688456955, + "learning_rate": 6.63995599156505e-05, + "loss": 0.71, + "mean_token_accuracy": 0.7828811645507813, + "num_tokens": 171148727.0, + "step": 72860 + }, + { + "epoch": 0.6681030530851747, + "learning_rate": 6.638122306775466e-05, + "loss": 0.6397, + "mean_token_accuracy": 0.7992956578731537, + "num_tokens": 171174453.0, + "step": 72870 + }, + { + "epoch": 0.6681947373246538, + "learning_rate": 6.636288621985881e-05, + "loss": 0.7121, + "mean_token_accuracy": 0.7838517189025879, + "num_tokens": 171199307.0, + "step": 72880 + }, + { + "epoch": 0.6682864215641331, + "learning_rate": 6.634454937196296e-05, + "loss": 0.6759, + "mean_token_accuracy": 0.7882214546203613, + "num_tokens": 171223982.0, + "step": 72890 + }, + { + "epoch": 0.6683781058036123, + "learning_rate": 6.632621252406711e-05, + "loss": 0.6526, + "mean_token_accuracy": 0.7965757131576539, + "num_tokens": 171249323.0, + "step": 72900 + }, + { + "epoch": 0.6684697900430916, + "learning_rate": 6.630787567617128e-05, + "loss": 0.6633, + "mean_token_accuracy": 0.799387526512146, + "num_tokens": 171275064.0, + "step": 72910 + }, + { + "epoch": 0.6685614742825708, + "learning_rate": 6.628953882827542e-05, + "loss": 0.7091, + "mean_token_accuracy": 0.7831669270992279, + "num_tokens": 171300116.0, + "step": 72920 + }, + { + "epoch": 0.6686531585220501, + "learning_rate": 6.627120198037957e-05, + "loss": 0.71, + "mean_token_accuracy": 0.7740885138511657, + "num_tokens": 171325405.0, + "step": 72930 + }, + { + "epoch": 0.6687448427615293, + "learning_rate": 6.625286513248373e-05, + "loss": 0.6874, + "mean_token_accuracy": 0.7902782261371613, + "num_tokens": 171349948.0, + "step": 72940 + }, + { + "epoch": 0.6688365270010085, + "learning_rate": 6.623452828458789e-05, + "loss": 0.7185, + "mean_token_accuracy": 0.7837597966194153, + "num_tokens": 171375229.0, + "step": 72950 + }, + { + "epoch": 0.6689282112404877, + "learning_rate": 6.621619143669204e-05, + "loss": 0.6605, + "mean_token_accuracy": 0.790293139219284, + "num_tokens": 171400530.0, + "step": 72960 + }, + { + "epoch": 0.669019895479967, + "learning_rate": 6.619785458879619e-05, + "loss": 0.6556, + "mean_token_accuracy": 0.7881445765495301, + "num_tokens": 171425526.0, + "step": 72970 + }, + { + "epoch": 0.6691115797194462, + "learning_rate": 6.617951774090034e-05, + "loss": 0.6922, + "mean_token_accuracy": 0.7873681724071503, + "num_tokens": 171450600.0, + "step": 72980 + }, + { + "epoch": 0.6692032639589255, + "learning_rate": 6.616118089300449e-05, + "loss": 0.6467, + "mean_token_accuracy": 0.7983907639980317, + "num_tokens": 171475655.0, + "step": 72990 + }, + { + "epoch": 0.6692949481984047, + "learning_rate": 6.614284404510866e-05, + "loss": 0.6668, + "mean_token_accuracy": 0.795628833770752, + "num_tokens": 171500945.0, + "step": 73000 + }, + { + "epoch": 0.6693866324378839, + "learning_rate": 6.612450719721281e-05, + "loss": 0.7142, + "mean_token_accuracy": 0.7879930019378663, + "num_tokens": 171525963.0, + "step": 73010 + }, + { + "epoch": 0.6694783166773631, + "learning_rate": 6.610617034931695e-05, + "loss": 0.7424, + "mean_token_accuracy": 0.778604942560196, + "num_tokens": 171551319.0, + "step": 73020 + }, + { + "epoch": 0.6695700009168424, + "learning_rate": 6.60878335014211e-05, + "loss": 0.7064, + "mean_token_accuracy": 0.7856544494628906, + "num_tokens": 171577097.0, + "step": 73030 + }, + { + "epoch": 0.6696616851563216, + "learning_rate": 6.606949665352527e-05, + "loss": 0.6927, + "mean_token_accuracy": 0.7791128635406495, + "num_tokens": 171601450.0, + "step": 73040 + }, + { + "epoch": 0.6697533693958009, + "learning_rate": 6.605115980562942e-05, + "loss": 0.6908, + "mean_token_accuracy": 0.7919116795063019, + "num_tokens": 171626694.0, + "step": 73050 + }, + { + "epoch": 0.6698450536352801, + "learning_rate": 6.603282295773357e-05, + "loss": 0.6766, + "mean_token_accuracy": 0.7944331347942353, + "num_tokens": 171651962.0, + "step": 73060 + }, + { + "epoch": 0.6699367378747594, + "learning_rate": 6.601448610983772e-05, + "loss": 0.7054, + "mean_token_accuracy": 0.7812461495399475, + "num_tokens": 171676244.0, + "step": 73070 + }, + { + "epoch": 0.6700284221142385, + "learning_rate": 6.599614926194187e-05, + "loss": 0.654, + "mean_token_accuracy": 0.7955682694911956, + "num_tokens": 171703177.0, + "step": 73080 + }, + { + "epoch": 0.6701201063537178, + "learning_rate": 6.597781241404603e-05, + "loss": 0.68, + "mean_token_accuracy": 0.7879145562648773, + "num_tokens": 171728410.0, + "step": 73090 + }, + { + "epoch": 0.670211790593197, + "learning_rate": 6.595947556615019e-05, + "loss": 0.7112, + "mean_token_accuracy": 0.7802545547485351, + "num_tokens": 171753339.0, + "step": 73100 + }, + { + "epoch": 0.6703034748326763, + "learning_rate": 6.594113871825434e-05, + "loss": 0.6859, + "mean_token_accuracy": 0.7883873760700226, + "num_tokens": 171778954.0, + "step": 73110 + }, + { + "epoch": 0.6703951590721555, + "learning_rate": 6.592280187035848e-05, + "loss": 0.6746, + "mean_token_accuracy": 0.7894088745117187, + "num_tokens": 171803285.0, + "step": 73120 + }, + { + "epoch": 0.6704868433116348, + "learning_rate": 6.590446502246265e-05, + "loss": 0.6615, + "mean_token_accuracy": 0.7912877678871155, + "num_tokens": 171828691.0, + "step": 73130 + }, + { + "epoch": 0.6705785275511139, + "learning_rate": 6.58861281745668e-05, + "loss": 0.6771, + "mean_token_accuracy": 0.7839479625225068, + "num_tokens": 171853681.0, + "step": 73140 + }, + { + "epoch": 0.6706702117905932, + "learning_rate": 6.586779132667095e-05, + "loss": 0.6995, + "mean_token_accuracy": 0.7861020505428314, + "num_tokens": 171879410.0, + "step": 73150 + }, + { + "epoch": 0.6707618960300724, + "learning_rate": 6.58494544787751e-05, + "loss": 0.6972, + "mean_token_accuracy": 0.7826953828334808, + "num_tokens": 171904417.0, + "step": 73160 + }, + { + "epoch": 0.6708535802695517, + "learning_rate": 6.583111763087925e-05, + "loss": 0.6528, + "mean_token_accuracy": 0.8015499711036682, + "num_tokens": 171929734.0, + "step": 73170 + }, + { + "epoch": 0.6709452645090309, + "learning_rate": 6.58127807829834e-05, + "loss": 0.6749, + "mean_token_accuracy": 0.7938455700874328, + "num_tokens": 171954603.0, + "step": 73180 + }, + { + "epoch": 0.6710369487485102, + "learning_rate": 6.579444393508756e-05, + "loss": 0.6744, + "mean_token_accuracy": 0.7895184636116028, + "num_tokens": 171979922.0, + "step": 73190 + }, + { + "epoch": 0.6711286329879894, + "learning_rate": 6.577610708719172e-05, + "loss": 0.6739, + "mean_token_accuracy": 0.789273327589035, + "num_tokens": 172004445.0, + "step": 73200 + }, + { + "epoch": 0.6712203172274686, + "learning_rate": 6.575777023929587e-05, + "loss": 0.715, + "mean_token_accuracy": 0.7817219018936157, + "num_tokens": 172029100.0, + "step": 73210 + }, + { + "epoch": 0.6713120014669478, + "learning_rate": 6.573943339140001e-05, + "loss": 0.6669, + "mean_token_accuracy": 0.7843082010746002, + "num_tokens": 172054157.0, + "step": 73220 + }, + { + "epoch": 0.6714036857064271, + "learning_rate": 6.572109654350418e-05, + "loss": 0.7128, + "mean_token_accuracy": 0.7877836048603057, + "num_tokens": 172080180.0, + "step": 73230 + }, + { + "epoch": 0.6714953699459063, + "learning_rate": 6.570275969560833e-05, + "loss": 0.6713, + "mean_token_accuracy": 0.7891487896442413, + "num_tokens": 172105474.0, + "step": 73240 + }, + { + "epoch": 0.6715870541853856, + "learning_rate": 6.568442284771248e-05, + "loss": 0.6367, + "mean_token_accuracy": 0.8021510303020477, + "num_tokens": 172130652.0, + "step": 73250 + }, + { + "epoch": 0.6716787384248648, + "learning_rate": 6.566608599981663e-05, + "loss": 0.6515, + "mean_token_accuracy": 0.7935626208782196, + "num_tokens": 172155382.0, + "step": 73260 + }, + { + "epoch": 0.671770422664344, + "learning_rate": 6.564774915192079e-05, + "loss": 0.6671, + "mean_token_accuracy": 0.7954720377922058, + "num_tokens": 172179711.0, + "step": 73270 + }, + { + "epoch": 0.6718621069038232, + "learning_rate": 6.562941230402494e-05, + "loss": 0.6753, + "mean_token_accuracy": 0.7912381947040558, + "num_tokens": 172204436.0, + "step": 73280 + }, + { + "epoch": 0.6719537911433024, + "learning_rate": 6.561107545612909e-05, + "loss": 0.6721, + "mean_token_accuracy": 0.7904717266559601, + "num_tokens": 172229578.0, + "step": 73290 + }, + { + "epoch": 0.6720454753827817, + "learning_rate": 6.559273860823326e-05, + "loss": 0.6599, + "mean_token_accuracy": 0.7967093229293823, + "num_tokens": 172254616.0, + "step": 73300 + }, + { + "epoch": 0.672137159622261, + "learning_rate": 6.557440176033741e-05, + "loss": 0.7043, + "mean_token_accuracy": 0.786264979839325, + "num_tokens": 172279921.0, + "step": 73310 + }, + { + "epoch": 0.6722288438617402, + "learning_rate": 6.555606491244155e-05, + "loss": 0.6793, + "mean_token_accuracy": 0.7897971332073211, + "num_tokens": 172304945.0, + "step": 73320 + }, + { + "epoch": 0.6723205281012195, + "learning_rate": 6.553772806454571e-05, + "loss": 0.6589, + "mean_token_accuracy": 0.7984269201755524, + "num_tokens": 172330363.0, + "step": 73330 + }, + { + "epoch": 0.6724122123406986, + "learning_rate": 6.551939121664986e-05, + "loss": 0.6807, + "mean_token_accuracy": 0.7922760248184204, + "num_tokens": 172356502.0, + "step": 73340 + }, + { + "epoch": 0.6725038965801778, + "learning_rate": 6.550105436875401e-05, + "loss": 0.7083, + "mean_token_accuracy": 0.7910124242305756, + "num_tokens": 172381830.0, + "step": 73350 + }, + { + "epoch": 0.6725955808196571, + "learning_rate": 6.548271752085817e-05, + "loss": 0.6998, + "mean_token_accuracy": 0.784187787771225, + "num_tokens": 172405797.0, + "step": 73360 + }, + { + "epoch": 0.6726872650591363, + "learning_rate": 6.546438067296232e-05, + "loss": 0.6606, + "mean_token_accuracy": 0.7906575322151184, + "num_tokens": 172430719.0, + "step": 73370 + }, + { + "epoch": 0.6727789492986156, + "learning_rate": 6.544604382506647e-05, + "loss": 0.6918, + "mean_token_accuracy": 0.7964638113975525, + "num_tokens": 172455765.0, + "step": 73380 + }, + { + "epoch": 0.6728706335380948, + "learning_rate": 6.542770697717064e-05, + "loss": 0.7141, + "mean_token_accuracy": 0.7809453129768371, + "num_tokens": 172481310.0, + "step": 73390 + }, + { + "epoch": 0.672962317777574, + "learning_rate": 6.540937012927479e-05, + "loss": 0.7024, + "mean_token_accuracy": 0.7876185357570649, + "num_tokens": 172506628.0, + "step": 73400 + }, + { + "epoch": 0.6730540020170532, + "learning_rate": 6.539103328137894e-05, + "loss": 0.703, + "mean_token_accuracy": 0.7867640376091003, + "num_tokens": 172531864.0, + "step": 73410 + }, + { + "epoch": 0.6731456862565325, + "learning_rate": 6.537269643348308e-05, + "loss": 0.6707, + "mean_token_accuracy": 0.789568567276001, + "num_tokens": 172556350.0, + "step": 73420 + }, + { + "epoch": 0.6732373704960117, + "learning_rate": 6.535435958558724e-05, + "loss": 0.6982, + "mean_token_accuracy": 0.7860197365283966, + "num_tokens": 172580987.0, + "step": 73430 + }, + { + "epoch": 0.673329054735491, + "learning_rate": 6.53360227376914e-05, + "loss": 0.6548, + "mean_token_accuracy": 0.790365743637085, + "num_tokens": 172606019.0, + "step": 73440 + }, + { + "epoch": 0.6734207389749702, + "learning_rate": 6.531768588979555e-05, + "loss": 0.7315, + "mean_token_accuracy": 0.7806772828102112, + "num_tokens": 172630551.0, + "step": 73450 + }, + { + "epoch": 0.6735124232144495, + "learning_rate": 6.52993490418997e-05, + "loss": 0.6828, + "mean_token_accuracy": 0.7910055220127106, + "num_tokens": 172656906.0, + "step": 73460 + }, + { + "epoch": 0.6736041074539286, + "learning_rate": 6.528101219400385e-05, + "loss": 0.6804, + "mean_token_accuracy": 0.7891456961631775, + "num_tokens": 172682163.0, + "step": 73470 + }, + { + "epoch": 0.6736957916934079, + "learning_rate": 6.5262675346108e-05, + "loss": 0.6349, + "mean_token_accuracy": 0.7979587912559509, + "num_tokens": 172707135.0, + "step": 73480 + }, + { + "epoch": 0.6737874759328871, + "learning_rate": 6.524433849821217e-05, + "loss": 0.68, + "mean_token_accuracy": 0.7888090193271637, + "num_tokens": 172732381.0, + "step": 73490 + }, + { + "epoch": 0.6738791601723664, + "learning_rate": 6.522600165031632e-05, + "loss": 0.6538, + "mean_token_accuracy": 0.7977280199527741, + "num_tokens": 172757946.0, + "step": 73500 + }, + { + "epoch": 0.6739708444118456, + "learning_rate": 6.520766480242047e-05, + "loss": 0.6804, + "mean_token_accuracy": 0.7910053670406342, + "num_tokens": 172782827.0, + "step": 73510 + }, + { + "epoch": 0.6740625286513249, + "learning_rate": 6.518932795452461e-05, + "loss": 0.6945, + "mean_token_accuracy": 0.7873681724071503, + "num_tokens": 172808140.0, + "step": 73520 + }, + { + "epoch": 0.674154212890804, + "learning_rate": 6.517099110662878e-05, + "loss": 0.6549, + "mean_token_accuracy": 0.7948734998703003, + "num_tokens": 172833779.0, + "step": 73530 + }, + { + "epoch": 0.6742458971302833, + "learning_rate": 6.515265425873293e-05, + "loss": 0.6752, + "mean_token_accuracy": 0.7912993013858796, + "num_tokens": 172858455.0, + "step": 73540 + }, + { + "epoch": 0.6743375813697625, + "learning_rate": 6.513431741083708e-05, + "loss": 0.6667, + "mean_token_accuracy": 0.7883789777755738, + "num_tokens": 172883605.0, + "step": 73550 + }, + { + "epoch": 0.6744292656092418, + "learning_rate": 6.511598056294123e-05, + "loss": 0.6969, + "mean_token_accuracy": 0.7820520997047424, + "num_tokens": 172908248.0, + "step": 73560 + }, + { + "epoch": 0.674520949848721, + "learning_rate": 6.509764371504538e-05, + "loss": 0.6855, + "mean_token_accuracy": 0.7876793026924134, + "num_tokens": 172933553.0, + "step": 73570 + }, + { + "epoch": 0.6746126340882003, + "learning_rate": 6.507930686714953e-05, + "loss": 0.6937, + "mean_token_accuracy": 0.7893419742584229, + "num_tokens": 172958479.0, + "step": 73580 + }, + { + "epoch": 0.6747043183276795, + "learning_rate": 6.50609700192537e-05, + "loss": 0.6733, + "mean_token_accuracy": 0.7927237272262573, + "num_tokens": 172983148.0, + "step": 73590 + }, + { + "epoch": 0.6747960025671587, + "learning_rate": 6.504263317135785e-05, + "loss": 0.6691, + "mean_token_accuracy": 0.792727929353714, + "num_tokens": 173008560.0, + "step": 73600 + }, + { + "epoch": 0.6748876868066379, + "learning_rate": 6.5024296323462e-05, + "loss": 0.6401, + "mean_token_accuracy": 0.8001432240009307, + "num_tokens": 173033695.0, + "step": 73610 + }, + { + "epoch": 0.6749793710461172, + "learning_rate": 6.500595947556616e-05, + "loss": 0.6549, + "mean_token_accuracy": 0.792980182170868, + "num_tokens": 173059877.0, + "step": 73620 + }, + { + "epoch": 0.6750710552855964, + "learning_rate": 6.498762262767031e-05, + "loss": 0.6909, + "mean_token_accuracy": 0.785872858762741, + "num_tokens": 173084537.0, + "step": 73630 + }, + { + "epoch": 0.6751627395250757, + "learning_rate": 6.496928577977446e-05, + "loss": 0.6566, + "mean_token_accuracy": 0.7980120778083801, + "num_tokens": 173109454.0, + "step": 73640 + }, + { + "epoch": 0.6752544237645549, + "learning_rate": 6.495094893187861e-05, + "loss": 0.6648, + "mean_token_accuracy": 0.794419401884079, + "num_tokens": 173134122.0, + "step": 73650 + }, + { + "epoch": 0.675346108004034, + "learning_rate": 6.493261208398276e-05, + "loss": 0.6476, + "mean_token_accuracy": 0.7986183345317841, + "num_tokens": 173159670.0, + "step": 73660 + }, + { + "epoch": 0.6754377922435133, + "learning_rate": 6.491427523608691e-05, + "loss": 0.6697, + "mean_token_accuracy": 0.7906152844429016, + "num_tokens": 173184164.0, + "step": 73670 + }, + { + "epoch": 0.6755294764829926, + "learning_rate": 6.489593838819107e-05, + "loss": 0.6596, + "mean_token_accuracy": 0.7963453114032746, + "num_tokens": 173208593.0, + "step": 73680 + }, + { + "epoch": 0.6756211607224718, + "learning_rate": 6.487760154029523e-05, + "loss": 0.6589, + "mean_token_accuracy": 0.79412140250206, + "num_tokens": 173233750.0, + "step": 73690 + }, + { + "epoch": 0.675712844961951, + "learning_rate": 6.485926469239938e-05, + "loss": 0.676, + "mean_token_accuracy": 0.7839472711086273, + "num_tokens": 173258367.0, + "step": 73700 + }, + { + "epoch": 0.6758045292014303, + "learning_rate": 6.484092784450354e-05, + "loss": 0.7077, + "mean_token_accuracy": 0.7804653346538544, + "num_tokens": 173283046.0, + "step": 73710 + }, + { + "epoch": 0.6758962134409096, + "learning_rate": 6.482259099660769e-05, + "loss": 0.6481, + "mean_token_accuracy": 0.7937946081161499, + "num_tokens": 173308416.0, + "step": 73720 + }, + { + "epoch": 0.6759878976803887, + "learning_rate": 6.480425414871184e-05, + "loss": 0.6814, + "mean_token_accuracy": 0.7905770540237427, + "num_tokens": 173332804.0, + "step": 73730 + }, + { + "epoch": 0.676079581919868, + "learning_rate": 6.478591730081599e-05, + "loss": 0.7081, + "mean_token_accuracy": 0.7803768277168274, + "num_tokens": 173356951.0, + "step": 73740 + }, + { + "epoch": 0.6761712661593472, + "learning_rate": 6.476758045292016e-05, + "loss": 0.6582, + "mean_token_accuracy": 0.7917639195919037, + "num_tokens": 173382580.0, + "step": 73750 + }, + { + "epoch": 0.6762629503988264, + "learning_rate": 6.47492436050243e-05, + "loss": 0.6959, + "mean_token_accuracy": 0.7806162357330322, + "num_tokens": 173407258.0, + "step": 73760 + }, + { + "epoch": 0.6763546346383057, + "learning_rate": 6.473090675712845e-05, + "loss": 0.7088, + "mean_token_accuracy": 0.788748037815094, + "num_tokens": 173432676.0, + "step": 73770 + }, + { + "epoch": 0.676446318877785, + "learning_rate": 6.47125699092326e-05, + "loss": 0.7046, + "mean_token_accuracy": 0.7841828286647796, + "num_tokens": 173457184.0, + "step": 73780 + }, + { + "epoch": 0.6765380031172642, + "learning_rate": 6.469423306133676e-05, + "loss": 0.6905, + "mean_token_accuracy": 0.7858833491802215, + "num_tokens": 173481866.0, + "step": 73790 + }, + { + "epoch": 0.6766296873567433, + "learning_rate": 6.467589621344092e-05, + "loss": 0.6471, + "mean_token_accuracy": 0.7961485326290131, + "num_tokens": 173506678.0, + "step": 73800 + }, + { + "epoch": 0.6767213715962226, + "learning_rate": 6.465755936554507e-05, + "loss": 0.6613, + "mean_token_accuracy": 0.7931310176849365, + "num_tokens": 173531666.0, + "step": 73810 + }, + { + "epoch": 0.6768130558357018, + "learning_rate": 6.463922251764922e-05, + "loss": 0.6936, + "mean_token_accuracy": 0.7924591898918152, + "num_tokens": 173557300.0, + "step": 73820 + }, + { + "epoch": 0.6769047400751811, + "learning_rate": 6.462088566975337e-05, + "loss": 0.7154, + "mean_token_accuracy": 0.785172563791275, + "num_tokens": 173582671.0, + "step": 73830 + }, + { + "epoch": 0.6769964243146603, + "learning_rate": 6.460254882185752e-05, + "loss": 0.7086, + "mean_token_accuracy": 0.7781278610229492, + "num_tokens": 173608046.0, + "step": 73840 + }, + { + "epoch": 0.6770881085541396, + "learning_rate": 6.458421197396169e-05, + "loss": 0.6828, + "mean_token_accuracy": 0.7839238464832305, + "num_tokens": 173632452.0, + "step": 73850 + }, + { + "epoch": 0.6771797927936187, + "learning_rate": 6.456587512606583e-05, + "loss": 0.6882, + "mean_token_accuracy": 0.7890949189662934, + "num_tokens": 173657156.0, + "step": 73860 + }, + { + "epoch": 0.677271477033098, + "learning_rate": 6.454753827816998e-05, + "loss": 0.7067, + "mean_token_accuracy": 0.7835882127285003, + "num_tokens": 173681693.0, + "step": 73870 + }, + { + "epoch": 0.6773631612725772, + "learning_rate": 6.452920143027414e-05, + "loss": 0.6766, + "mean_token_accuracy": 0.7939685761928559, + "num_tokens": 173706987.0, + "step": 73880 + }, + { + "epoch": 0.6774548455120565, + "learning_rate": 6.45108645823783e-05, + "loss": 0.6723, + "mean_token_accuracy": 0.7910866022109986, + "num_tokens": 173732998.0, + "step": 73890 + }, + { + "epoch": 0.6775465297515357, + "learning_rate": 6.449252773448245e-05, + "loss": 0.6639, + "mean_token_accuracy": 0.7986181795597076, + "num_tokens": 173757448.0, + "step": 73900 + }, + { + "epoch": 0.677638213991015, + "learning_rate": 6.44741908865866e-05, + "loss": 0.6625, + "mean_token_accuracy": 0.7926622331142426, + "num_tokens": 173782658.0, + "step": 73910 + }, + { + "epoch": 0.6777298982304942, + "learning_rate": 6.445585403869075e-05, + "loss": 0.686, + "mean_token_accuracy": 0.7847441971302033, + "num_tokens": 173807028.0, + "step": 73920 + }, + { + "epoch": 0.6778215824699734, + "learning_rate": 6.44375171907949e-05, + "loss": 0.6569, + "mean_token_accuracy": 0.7972072541713715, + "num_tokens": 173832264.0, + "step": 73930 + }, + { + "epoch": 0.6779132667094526, + "learning_rate": 6.441918034289906e-05, + "loss": 0.6622, + "mean_token_accuracy": 0.7944561958312988, + "num_tokens": 173857047.0, + "step": 73940 + }, + { + "epoch": 0.6780049509489319, + "learning_rate": 6.440084349500322e-05, + "loss": 0.7022, + "mean_token_accuracy": 0.7907737970352173, + "num_tokens": 173881230.0, + "step": 73950 + }, + { + "epoch": 0.6780966351884111, + "learning_rate": 6.438250664710736e-05, + "loss": 0.6913, + "mean_token_accuracy": 0.7904622495174408, + "num_tokens": 173906479.0, + "step": 73960 + }, + { + "epoch": 0.6781883194278904, + "learning_rate": 6.436416979921151e-05, + "loss": 0.689, + "mean_token_accuracy": 0.787735641002655, + "num_tokens": 173932016.0, + "step": 73970 + }, + { + "epoch": 0.6782800036673696, + "learning_rate": 6.434583295131568e-05, + "loss": 0.659, + "mean_token_accuracy": 0.7958022475242614, + "num_tokens": 173957480.0, + "step": 73980 + }, + { + "epoch": 0.6783716879068488, + "learning_rate": 6.432749610341983e-05, + "loss": 0.6608, + "mean_token_accuracy": 0.79616779088974, + "num_tokens": 173982048.0, + "step": 73990 + }, + { + "epoch": 0.678463372146328, + "learning_rate": 6.430915925552398e-05, + "loss": 0.6986, + "mean_token_accuracy": 0.7894332766532898, + "num_tokens": 174007560.0, + "step": 74000 + }, + { + "epoch": 0.6785550563858073, + "learning_rate": 6.429082240762813e-05, + "loss": 0.7092, + "mean_token_accuracy": 0.786923611164093, + "num_tokens": 174032306.0, + "step": 74010 + }, + { + "epoch": 0.6786467406252865, + "learning_rate": 6.427248555973228e-05, + "loss": 0.6708, + "mean_token_accuracy": 0.7923457264900208, + "num_tokens": 174057463.0, + "step": 74020 + }, + { + "epoch": 0.6787384248647658, + "learning_rate": 6.425414871183644e-05, + "loss": 0.6858, + "mean_token_accuracy": 0.7890528321266175, + "num_tokens": 174081987.0, + "step": 74030 + }, + { + "epoch": 0.678830109104245, + "learning_rate": 6.423581186394059e-05, + "loss": 0.6998, + "mean_token_accuracy": 0.7877249181270599, + "num_tokens": 174106677.0, + "step": 74040 + }, + { + "epoch": 0.6789217933437243, + "learning_rate": 6.421747501604475e-05, + "loss": 0.6567, + "mean_token_accuracy": 0.7965851545333862, + "num_tokens": 174131417.0, + "step": 74050 + }, + { + "epoch": 0.6790134775832034, + "learning_rate": 6.419913816814889e-05, + "loss": 0.6708, + "mean_token_accuracy": 0.7861759960651398, + "num_tokens": 174155799.0, + "step": 74060 + }, + { + "epoch": 0.6791051618226827, + "learning_rate": 6.418080132025304e-05, + "loss": 0.6653, + "mean_token_accuracy": 0.8005099058151245, + "num_tokens": 174180479.0, + "step": 74070 + }, + { + "epoch": 0.6791968460621619, + "learning_rate": 6.416246447235721e-05, + "loss": 0.6853, + "mean_token_accuracy": 0.7853318393230438, + "num_tokens": 174205332.0, + "step": 74080 + }, + { + "epoch": 0.6792885303016412, + "learning_rate": 6.414412762446136e-05, + "loss": 0.6795, + "mean_token_accuracy": 0.7856890499591828, + "num_tokens": 174230762.0, + "step": 74090 + }, + { + "epoch": 0.6793802145411204, + "learning_rate": 6.412579077656551e-05, + "loss": 0.6637, + "mean_token_accuracy": 0.7959155738353729, + "num_tokens": 174256126.0, + "step": 74100 + }, + { + "epoch": 0.6794718987805997, + "learning_rate": 6.410745392866966e-05, + "loss": 0.6963, + "mean_token_accuracy": 0.791889774799347, + "num_tokens": 174281286.0, + "step": 74110 + }, + { + "epoch": 0.6795635830200788, + "learning_rate": 6.408911708077382e-05, + "loss": 0.6779, + "mean_token_accuracy": 0.7931702911853791, + "num_tokens": 174307231.0, + "step": 74120 + }, + { + "epoch": 0.679655267259558, + "learning_rate": 6.407078023287797e-05, + "loss": 0.667, + "mean_token_accuracy": 0.794391143321991, + "num_tokens": 174332261.0, + "step": 74130 + }, + { + "epoch": 0.6797469514990373, + "learning_rate": 6.405244338498212e-05, + "loss": 0.6895, + "mean_token_accuracy": 0.7863744020462036, + "num_tokens": 174357108.0, + "step": 74140 + }, + { + "epoch": 0.6798386357385166, + "learning_rate": 6.403410653708629e-05, + "loss": 0.6753, + "mean_token_accuracy": 0.7901894748210907, + "num_tokens": 174381106.0, + "step": 74150 + }, + { + "epoch": 0.6799303199779958, + "learning_rate": 6.401576968919042e-05, + "loss": 0.6859, + "mean_token_accuracy": 0.7880065619945527, + "num_tokens": 174406090.0, + "step": 74160 + }, + { + "epoch": 0.680022004217475, + "learning_rate": 6.399743284129458e-05, + "loss": 0.6722, + "mean_token_accuracy": 0.7924544394016266, + "num_tokens": 174431369.0, + "step": 74170 + }, + { + "epoch": 0.6801136884569543, + "learning_rate": 6.397909599339874e-05, + "loss": 0.6822, + "mean_token_accuracy": 0.7808837294578552, + "num_tokens": 174455877.0, + "step": 74180 + }, + { + "epoch": 0.6802053726964334, + "learning_rate": 6.396075914550289e-05, + "loss": 0.6809, + "mean_token_accuracy": 0.7911515176296234, + "num_tokens": 174480786.0, + "step": 74190 + }, + { + "epoch": 0.6802970569359127, + "learning_rate": 6.394242229760705e-05, + "loss": 0.661, + "mean_token_accuracy": 0.7959784805774689, + "num_tokens": 174506202.0, + "step": 74200 + }, + { + "epoch": 0.6803887411753919, + "learning_rate": 6.39240854497112e-05, + "loss": 0.6634, + "mean_token_accuracy": 0.7917146682739258, + "num_tokens": 174531727.0, + "step": 74210 + }, + { + "epoch": 0.6804804254148712, + "learning_rate": 6.390574860181535e-05, + "loss": 0.6438, + "mean_token_accuracy": 0.7946355164051055, + "num_tokens": 174556776.0, + "step": 74220 + }, + { + "epoch": 0.6805721096543504, + "learning_rate": 6.38874117539195e-05, + "loss": 0.6838, + "mean_token_accuracy": 0.7886763453483582, + "num_tokens": 174581341.0, + "step": 74230 + }, + { + "epoch": 0.6806637938938297, + "learning_rate": 6.386907490602367e-05, + "loss": 0.7162, + "mean_token_accuracy": 0.7835057616233826, + "num_tokens": 174606350.0, + "step": 74240 + }, + { + "epoch": 0.6807554781333088, + "learning_rate": 6.385073805812782e-05, + "loss": 0.6958, + "mean_token_accuracy": 0.7827196896076203, + "num_tokens": 174630726.0, + "step": 74250 + }, + { + "epoch": 0.6808471623727881, + "learning_rate": 6.383240121023196e-05, + "loss": 0.626, + "mean_token_accuracy": 0.7978158891201019, + "num_tokens": 174656196.0, + "step": 74260 + }, + { + "epoch": 0.6809388466122673, + "learning_rate": 6.381406436233611e-05, + "loss": 0.6436, + "mean_token_accuracy": 0.7940483272075654, + "num_tokens": 174681488.0, + "step": 74270 + }, + { + "epoch": 0.6810305308517466, + "learning_rate": 6.379572751444027e-05, + "loss": 0.68, + "mean_token_accuracy": 0.7875082731246948, + "num_tokens": 174706769.0, + "step": 74280 + }, + { + "epoch": 0.6811222150912258, + "learning_rate": 6.377739066654443e-05, + "loss": 0.7126, + "mean_token_accuracy": 0.783999752998352, + "num_tokens": 174730689.0, + "step": 74290 + }, + { + "epoch": 0.6812138993307051, + "learning_rate": 6.375905381864858e-05, + "loss": 0.6652, + "mean_token_accuracy": 0.7903046488761902, + "num_tokens": 174755620.0, + "step": 74300 + }, + { + "epoch": 0.6813055835701843, + "learning_rate": 6.374071697075273e-05, + "loss": 0.6661, + "mean_token_accuracy": 0.7965183019638061, + "num_tokens": 174780860.0, + "step": 74310 + }, + { + "epoch": 0.6813972678096635, + "learning_rate": 6.372238012285688e-05, + "loss": 0.649, + "mean_token_accuracy": 0.7939989566802979, + "num_tokens": 174806026.0, + "step": 74320 + }, + { + "epoch": 0.6814889520491427, + "learning_rate": 6.370404327496103e-05, + "loss": 0.6817, + "mean_token_accuracy": 0.7914859235286713, + "num_tokens": 174830641.0, + "step": 74330 + }, + { + "epoch": 0.681580636288622, + "learning_rate": 6.36857064270652e-05, + "loss": 0.6668, + "mean_token_accuracy": 0.7908641993999481, + "num_tokens": 174855848.0, + "step": 74340 + }, + { + "epoch": 0.6816723205281012, + "learning_rate": 6.366736957916935e-05, + "loss": 0.6894, + "mean_token_accuracy": 0.7872664928436279, + "num_tokens": 174880558.0, + "step": 74350 + }, + { + "epoch": 0.6817640047675805, + "learning_rate": 6.364903273127349e-05, + "loss": 0.6606, + "mean_token_accuracy": 0.7983326435089111, + "num_tokens": 174904988.0, + "step": 74360 + }, + { + "epoch": 0.6818556890070597, + "learning_rate": 6.363069588337765e-05, + "loss": 0.7119, + "mean_token_accuracy": 0.7824760377407074, + "num_tokens": 174930249.0, + "step": 74370 + }, + { + "epoch": 0.6819473732465389, + "learning_rate": 6.36123590354818e-05, + "loss": 0.675, + "mean_token_accuracy": 0.7913299977779389, + "num_tokens": 174955480.0, + "step": 74380 + }, + { + "epoch": 0.6820390574860181, + "learning_rate": 6.359402218758596e-05, + "loss": 0.6812, + "mean_token_accuracy": 0.7869184613227844, + "num_tokens": 174980423.0, + "step": 74390 + }, + { + "epoch": 0.6821307417254974, + "learning_rate": 6.357568533969011e-05, + "loss": 0.6836, + "mean_token_accuracy": 0.788817697763443, + "num_tokens": 175004986.0, + "step": 74400 + }, + { + "epoch": 0.6822224259649766, + "learning_rate": 6.355734849179426e-05, + "loss": 0.6741, + "mean_token_accuracy": 0.7905064821243286, + "num_tokens": 175030631.0, + "step": 74410 + }, + { + "epoch": 0.6823141102044559, + "learning_rate": 6.353901164389841e-05, + "loss": 0.6826, + "mean_token_accuracy": 0.7935149848461152, + "num_tokens": 175057046.0, + "step": 74420 + }, + { + "epoch": 0.6824057944439351, + "learning_rate": 6.352067479600257e-05, + "loss": 0.6983, + "mean_token_accuracy": 0.7898350715637207, + "num_tokens": 175082393.0, + "step": 74430 + }, + { + "epoch": 0.6824974786834144, + "learning_rate": 6.350233794810673e-05, + "loss": 0.6717, + "mean_token_accuracy": 0.7930544734001159, + "num_tokens": 175108161.0, + "step": 74440 + }, + { + "epoch": 0.6825891629228935, + "learning_rate": 6.348400110021088e-05, + "loss": 0.6927, + "mean_token_accuracy": 0.7862828433513641, + "num_tokens": 175132943.0, + "step": 74450 + }, + { + "epoch": 0.6826808471623728, + "learning_rate": 6.346566425231502e-05, + "loss": 0.6377, + "mean_token_accuracy": 0.7992774963378906, + "num_tokens": 175158109.0, + "step": 74460 + }, + { + "epoch": 0.682772531401852, + "learning_rate": 6.344732740441919e-05, + "loss": 0.6907, + "mean_token_accuracy": 0.7890061199665069, + "num_tokens": 175182649.0, + "step": 74470 + }, + { + "epoch": 0.6828642156413313, + "learning_rate": 6.342899055652334e-05, + "loss": 0.7082, + "mean_token_accuracy": 0.7810740888118743, + "num_tokens": 175208200.0, + "step": 74480 + }, + { + "epoch": 0.6829558998808105, + "learning_rate": 6.341065370862749e-05, + "loss": 0.7035, + "mean_token_accuracy": 0.7838903844356537, + "num_tokens": 175232910.0, + "step": 74490 + }, + { + "epoch": 0.6830475841202898, + "learning_rate": 6.339231686073166e-05, + "loss": 0.652, + "mean_token_accuracy": 0.7972717523574829, + "num_tokens": 175258232.0, + "step": 74500 + }, + { + "epoch": 0.6831392683597689, + "learning_rate": 6.33739800128358e-05, + "loss": 0.6479, + "mean_token_accuracy": 0.7950194478034973, + "num_tokens": 175282824.0, + "step": 74510 + }, + { + "epoch": 0.6832309525992482, + "learning_rate": 6.335564316493995e-05, + "loss": 0.6951, + "mean_token_accuracy": 0.7904062986373901, + "num_tokens": 175307586.0, + "step": 74520 + }, + { + "epoch": 0.6833226368387274, + "learning_rate": 6.33373063170441e-05, + "loss": 0.6757, + "mean_token_accuracy": 0.794041782617569, + "num_tokens": 175332684.0, + "step": 74530 + }, + { + "epoch": 0.6834143210782067, + "learning_rate": 6.331896946914826e-05, + "loss": 0.6795, + "mean_token_accuracy": 0.7868710994720459, + "num_tokens": 175357166.0, + "step": 74540 + }, + { + "epoch": 0.6835060053176859, + "learning_rate": 6.330063262125241e-05, + "loss": 0.7009, + "mean_token_accuracy": 0.787664407491684, + "num_tokens": 175381807.0, + "step": 74550 + }, + { + "epoch": 0.6835976895571652, + "learning_rate": 6.328229577335655e-05, + "loss": 0.6669, + "mean_token_accuracy": 0.7960774600505829, + "num_tokens": 175407486.0, + "step": 74560 + }, + { + "epoch": 0.6836893737966444, + "learning_rate": 6.326395892546072e-05, + "loss": 0.6841, + "mean_token_accuracy": 0.7878939509391785, + "num_tokens": 175431787.0, + "step": 74570 + }, + { + "epoch": 0.6837810580361235, + "learning_rate": 6.324562207756487e-05, + "loss": 0.6767, + "mean_token_accuracy": 0.7889977872371674, + "num_tokens": 175456698.0, + "step": 74580 + }, + { + "epoch": 0.6838727422756028, + "learning_rate": 6.322728522966902e-05, + "loss": 0.7481, + "mean_token_accuracy": 0.7701053440570831, + "num_tokens": 175480707.0, + "step": 74590 + }, + { + "epoch": 0.683964426515082, + "learning_rate": 6.320894838177319e-05, + "loss": 0.6867, + "mean_token_accuracy": 0.7864112198352814, + "num_tokens": 175505215.0, + "step": 74600 + }, + { + "epoch": 0.6840561107545613, + "learning_rate": 6.319061153387733e-05, + "loss": 0.7053, + "mean_token_accuracy": 0.7879898548126221, + "num_tokens": 175529383.0, + "step": 74610 + }, + { + "epoch": 0.6841477949940405, + "learning_rate": 6.317227468598148e-05, + "loss": 0.7052, + "mean_token_accuracy": 0.7819807648658752, + "num_tokens": 175554601.0, + "step": 74620 + }, + { + "epoch": 0.6842394792335198, + "learning_rate": 6.315393783808563e-05, + "loss": 0.6865, + "mean_token_accuracy": 0.7832239806652069, + "num_tokens": 175580848.0, + "step": 74630 + }, + { + "epoch": 0.6843311634729989, + "learning_rate": 6.31356009901898e-05, + "loss": 0.6976, + "mean_token_accuracy": 0.7887556612491607, + "num_tokens": 175605583.0, + "step": 74640 + }, + { + "epoch": 0.6844228477124782, + "learning_rate": 6.311726414229395e-05, + "loss": 0.6877, + "mean_token_accuracy": 0.785181850194931, + "num_tokens": 175630800.0, + "step": 74650 + }, + { + "epoch": 0.6845145319519574, + "learning_rate": 6.309892729439809e-05, + "loss": 0.6557, + "mean_token_accuracy": 0.7960622072219848, + "num_tokens": 175655355.0, + "step": 74660 + }, + { + "epoch": 0.6846062161914367, + "learning_rate": 6.308059044650225e-05, + "loss": 0.6625, + "mean_token_accuracy": 0.7905114889144897, + "num_tokens": 175680500.0, + "step": 74670 + }, + { + "epoch": 0.6846979004309159, + "learning_rate": 6.30622535986064e-05, + "loss": 0.6765, + "mean_token_accuracy": 0.7875080823898315, + "num_tokens": 175706096.0, + "step": 74680 + }, + { + "epoch": 0.6847895846703952, + "learning_rate": 6.304391675071055e-05, + "loss": 0.658, + "mean_token_accuracy": 0.7931058704853058, + "num_tokens": 175731007.0, + "step": 74690 + }, + { + "epoch": 0.6848812689098744, + "learning_rate": 6.302557990281472e-05, + "loss": 0.674, + "mean_token_accuracy": 0.791066724061966, + "num_tokens": 175755634.0, + "step": 74700 + }, + { + "epoch": 0.6849729531493536, + "learning_rate": 6.300724305491886e-05, + "loss": 0.7134, + "mean_token_accuracy": 0.7832394957542419, + "num_tokens": 175780344.0, + "step": 74710 + }, + { + "epoch": 0.6850646373888328, + "learning_rate": 6.298890620702301e-05, + "loss": 0.6556, + "mean_token_accuracy": 0.7953931987285614, + "num_tokens": 175805734.0, + "step": 74720 + }, + { + "epoch": 0.6851563216283121, + "learning_rate": 6.297056935912718e-05, + "loss": 0.6642, + "mean_token_accuracy": 0.7935296833515167, + "num_tokens": 175830590.0, + "step": 74730 + }, + { + "epoch": 0.6852480058677913, + "learning_rate": 6.295223251123133e-05, + "loss": 0.6702, + "mean_token_accuracy": 0.7878190457820893, + "num_tokens": 175855581.0, + "step": 74740 + }, + { + "epoch": 0.6853396901072706, + "learning_rate": 6.293389566333548e-05, + "loss": 0.6586, + "mean_token_accuracy": 0.7975728690624238, + "num_tokens": 175880549.0, + "step": 74750 + }, + { + "epoch": 0.6854313743467498, + "learning_rate": 6.291555881543962e-05, + "loss": 0.6628, + "mean_token_accuracy": 0.7912991404533386, + "num_tokens": 175905071.0, + "step": 74760 + }, + { + "epoch": 0.685523058586229, + "learning_rate": 6.289722196754378e-05, + "loss": 0.6697, + "mean_token_accuracy": 0.7938998997211456, + "num_tokens": 175930188.0, + "step": 74770 + }, + { + "epoch": 0.6856147428257082, + "learning_rate": 6.287888511964793e-05, + "loss": 0.6793, + "mean_token_accuracy": 0.7936573028564453, + "num_tokens": 175955489.0, + "step": 74780 + }, + { + "epoch": 0.6857064270651875, + "learning_rate": 6.286054827175209e-05, + "loss": 0.6707, + "mean_token_accuracy": 0.7974761843681335, + "num_tokens": 175980142.0, + "step": 74790 + }, + { + "epoch": 0.6857981113046667, + "learning_rate": 6.284221142385625e-05, + "loss": 0.6872, + "mean_token_accuracy": 0.7910990118980408, + "num_tokens": 176005801.0, + "step": 74800 + }, + { + "epoch": 0.685889795544146, + "learning_rate": 6.282387457596039e-05, + "loss": 0.7063, + "mean_token_accuracy": 0.788154023885727, + "num_tokens": 176031557.0, + "step": 74810 + }, + { + "epoch": 0.6859814797836252, + "learning_rate": 6.280553772806454e-05, + "loss": 0.6789, + "mean_token_accuracy": 0.7894406259059906, + "num_tokens": 176056786.0, + "step": 74820 + }, + { + "epoch": 0.6860731640231045, + "learning_rate": 6.278720088016871e-05, + "loss": 0.689, + "mean_token_accuracy": 0.7851300597190857, + "num_tokens": 176081316.0, + "step": 74830 + }, + { + "epoch": 0.6861648482625836, + "learning_rate": 6.276886403227286e-05, + "loss": 0.6962, + "mean_token_accuracy": 0.7852903544902802, + "num_tokens": 176106431.0, + "step": 74840 + }, + { + "epoch": 0.6862565325020629, + "learning_rate": 6.275052718437701e-05, + "loss": 0.6942, + "mean_token_accuracy": 0.7856343805789947, + "num_tokens": 176132456.0, + "step": 74850 + }, + { + "epoch": 0.6863482167415421, + "learning_rate": 6.273219033648116e-05, + "loss": 0.6819, + "mean_token_accuracy": 0.7907595276832581, + "num_tokens": 176157247.0, + "step": 74860 + }, + { + "epoch": 0.6864399009810214, + "learning_rate": 6.271385348858532e-05, + "loss": 0.6958, + "mean_token_accuracy": 0.7894757807254791, + "num_tokens": 176182554.0, + "step": 74870 + }, + { + "epoch": 0.6865315852205006, + "learning_rate": 6.269551664068947e-05, + "loss": 0.6695, + "mean_token_accuracy": 0.789708924293518, + "num_tokens": 176207647.0, + "step": 74880 + }, + { + "epoch": 0.6866232694599799, + "learning_rate": 6.267717979279362e-05, + "loss": 0.6944, + "mean_token_accuracy": 0.788169902563095, + "num_tokens": 176232333.0, + "step": 74890 + }, + { + "epoch": 0.686714953699459, + "learning_rate": 6.265884294489778e-05, + "loss": 0.6958, + "mean_token_accuracy": 0.7871954560279846, + "num_tokens": 176256999.0, + "step": 74900 + }, + { + "epoch": 0.6868066379389383, + "learning_rate": 6.264050609700192e-05, + "loss": 0.674, + "mean_token_accuracy": 0.7925026893615723, + "num_tokens": 176282468.0, + "step": 74910 + }, + { + "epoch": 0.6868983221784175, + "learning_rate": 6.262216924910607e-05, + "loss": 0.684, + "mean_token_accuracy": 0.7899601221084595, + "num_tokens": 176307350.0, + "step": 74920 + }, + { + "epoch": 0.6869900064178968, + "learning_rate": 6.260383240121024e-05, + "loss": 0.7292, + "mean_token_accuracy": 0.7792982399463654, + "num_tokens": 176332281.0, + "step": 74930 + }, + { + "epoch": 0.687081690657376, + "learning_rate": 6.258549555331439e-05, + "loss": 0.6984, + "mean_token_accuracy": 0.7857298851013184, + "num_tokens": 176356415.0, + "step": 74940 + }, + { + "epoch": 0.6871733748968553, + "learning_rate": 6.256715870541854e-05, + "loss": 0.6982, + "mean_token_accuracy": 0.7876420080661773, + "num_tokens": 176381918.0, + "step": 74950 + }, + { + "epoch": 0.6872650591363345, + "learning_rate": 6.25488218575227e-05, + "loss": 0.7004, + "mean_token_accuracy": 0.7868048846721649, + "num_tokens": 176408042.0, + "step": 74960 + }, + { + "epoch": 0.6873567433758137, + "learning_rate": 6.253048500962685e-05, + "loss": 0.6993, + "mean_token_accuracy": 0.7900464177131653, + "num_tokens": 176433361.0, + "step": 74970 + }, + { + "epoch": 0.6874484276152929, + "learning_rate": 6.2512148161731e-05, + "loss": 0.6782, + "mean_token_accuracy": 0.791328901052475, + "num_tokens": 176458697.0, + "step": 74980 + }, + { + "epoch": 0.6875401118547722, + "learning_rate": 6.249381131383516e-05, + "loss": 0.6399, + "mean_token_accuracy": 0.8019151329994202, + "num_tokens": 176484658.0, + "step": 74990 + }, + { + "epoch": 0.6876317960942514, + "learning_rate": 6.247547446593932e-05, + "loss": 0.6879, + "mean_token_accuracy": 0.7877026379108429, + "num_tokens": 176509669.0, + "step": 75000 + }, + { + "epoch": 0.6877234803337307, + "learning_rate": 6.245713761804345e-05, + "loss": 0.6717, + "mean_token_accuracy": 0.793970137834549, + "num_tokens": 176534034.0, + "step": 75010 + }, + { + "epoch": 0.6878151645732099, + "learning_rate": 6.24388007701476e-05, + "loss": 0.6699, + "mean_token_accuracy": 0.7973458468914032, + "num_tokens": 176559260.0, + "step": 75020 + }, + { + "epoch": 0.6879068488126892, + "learning_rate": 6.242046392225177e-05, + "loss": 0.6774, + "mean_token_accuracy": 0.7890937805175782, + "num_tokens": 176584684.0, + "step": 75030 + }, + { + "epoch": 0.6879985330521683, + "learning_rate": 6.240212707435592e-05, + "loss": 0.6848, + "mean_token_accuracy": 0.7890117824077606, + "num_tokens": 176610226.0, + "step": 75040 + }, + { + "epoch": 0.6880902172916475, + "learning_rate": 6.238379022646008e-05, + "loss": 0.7119, + "mean_token_accuracy": 0.7836406707763672, + "num_tokens": 176635726.0, + "step": 75050 + }, + { + "epoch": 0.6881819015311268, + "learning_rate": 6.236545337856423e-05, + "loss": 0.6726, + "mean_token_accuracy": 0.793917179107666, + "num_tokens": 176660949.0, + "step": 75060 + }, + { + "epoch": 0.688273585770606, + "learning_rate": 6.234711653066838e-05, + "loss": 0.6581, + "mean_token_accuracy": 0.7956817448139191, + "num_tokens": 176686556.0, + "step": 75070 + }, + { + "epoch": 0.6883652700100853, + "learning_rate": 6.232877968277253e-05, + "loss": 0.6844, + "mean_token_accuracy": 0.7914393424987793, + "num_tokens": 176712147.0, + "step": 75080 + }, + { + "epoch": 0.6884569542495645, + "learning_rate": 6.23104428348767e-05, + "loss": 0.6749, + "mean_token_accuracy": 0.7879520237445832, + "num_tokens": 176738115.0, + "step": 75090 + }, + { + "epoch": 0.6885486384890437, + "learning_rate": 6.229210598698085e-05, + "loss": 0.6593, + "mean_token_accuracy": 0.7963025748729706, + "num_tokens": 176763003.0, + "step": 75100 + }, + { + "epoch": 0.6886403227285229, + "learning_rate": 6.227376913908499e-05, + "loss": 0.6585, + "mean_token_accuracy": 0.7946280837059021, + "num_tokens": 176788072.0, + "step": 75110 + }, + { + "epoch": 0.6887320069680022, + "learning_rate": 6.225543229118915e-05, + "loss": 0.67, + "mean_token_accuracy": 0.7864981591701508, + "num_tokens": 176812355.0, + "step": 75120 + }, + { + "epoch": 0.6888236912074814, + "learning_rate": 6.22370954432933e-05, + "loss": 0.6627, + "mean_token_accuracy": 0.7990666508674622, + "num_tokens": 176837879.0, + "step": 75130 + }, + { + "epoch": 0.6889153754469607, + "learning_rate": 6.221875859539746e-05, + "loss": 0.6846, + "mean_token_accuracy": 0.7910236716270447, + "num_tokens": 176863173.0, + "step": 75140 + }, + { + "epoch": 0.6890070596864399, + "learning_rate": 6.220042174750161e-05, + "loss": 0.7191, + "mean_token_accuracy": 0.7803408920764923, + "num_tokens": 176887485.0, + "step": 75150 + }, + { + "epoch": 0.6890987439259192, + "learning_rate": 6.218208489960576e-05, + "loss": 0.6582, + "mean_token_accuracy": 0.7980068564414978, + "num_tokens": 176912921.0, + "step": 75160 + }, + { + "epoch": 0.6891904281653983, + "learning_rate": 6.216374805170991e-05, + "loss": 0.7019, + "mean_token_accuracy": 0.7854265809059143, + "num_tokens": 176937210.0, + "step": 75170 + }, + { + "epoch": 0.6892821124048776, + "learning_rate": 6.214541120381406e-05, + "loss": 0.6882, + "mean_token_accuracy": 0.7832460999488831, + "num_tokens": 176961269.0, + "step": 75180 + }, + { + "epoch": 0.6893737966443568, + "learning_rate": 6.212707435591823e-05, + "loss": 0.6857, + "mean_token_accuracy": 0.7883375585079193, + "num_tokens": 176986388.0, + "step": 75190 + }, + { + "epoch": 0.6894654808838361, + "learning_rate": 6.210873750802238e-05, + "loss": 0.6956, + "mean_token_accuracy": 0.7831620633602142, + "num_tokens": 177011397.0, + "step": 75200 + }, + { + "epoch": 0.6895571651233153, + "learning_rate": 6.209040066012652e-05, + "loss": 0.6854, + "mean_token_accuracy": 0.7810591638088227, + "num_tokens": 177036885.0, + "step": 75210 + }, + { + "epoch": 0.6896488493627946, + "learning_rate": 6.207206381223068e-05, + "loss": 0.6611, + "mean_token_accuracy": 0.7925475060939788, + "num_tokens": 177062510.0, + "step": 75220 + }, + { + "epoch": 0.6897405336022737, + "learning_rate": 6.205372696433484e-05, + "loss": 0.6533, + "mean_token_accuracy": 0.7994494497776031, + "num_tokens": 177086825.0, + "step": 75230 + }, + { + "epoch": 0.689832217841753, + "learning_rate": 6.203539011643899e-05, + "loss": 0.6987, + "mean_token_accuracy": 0.7893237888813018, + "num_tokens": 177111978.0, + "step": 75240 + }, + { + "epoch": 0.6899239020812322, + "learning_rate": 6.201705326854314e-05, + "loss": 0.6868, + "mean_token_accuracy": 0.7898162841796875, + "num_tokens": 177137586.0, + "step": 75250 + }, + { + "epoch": 0.6900155863207115, + "learning_rate": 6.199871642064729e-05, + "loss": 0.6605, + "mean_token_accuracy": 0.7909402132034302, + "num_tokens": 177163012.0, + "step": 75260 + }, + { + "epoch": 0.6901072705601907, + "learning_rate": 6.198037957275144e-05, + "loss": 0.6866, + "mean_token_accuracy": 0.7860115885734558, + "num_tokens": 177188443.0, + "step": 75270 + }, + { + "epoch": 0.69019895479967, + "learning_rate": 6.19620427248556e-05, + "loss": 0.6926, + "mean_token_accuracy": 0.7854578197002411, + "num_tokens": 177212813.0, + "step": 75280 + }, + { + "epoch": 0.6902906390391492, + "learning_rate": 6.194370587695976e-05, + "loss": 0.6944, + "mean_token_accuracy": 0.7880738377571106, + "num_tokens": 177238263.0, + "step": 75290 + }, + { + "epoch": 0.6903823232786284, + "learning_rate": 6.192536902906391e-05, + "loss": 0.7251, + "mean_token_accuracy": 0.7831411898136139, + "num_tokens": 177263489.0, + "step": 75300 + }, + { + "epoch": 0.6904740075181076, + "learning_rate": 6.190703218116805e-05, + "loss": 0.6338, + "mean_token_accuracy": 0.801439744234085, + "num_tokens": 177288428.0, + "step": 75310 + }, + { + "epoch": 0.6905656917575869, + "learning_rate": 6.188869533327222e-05, + "loss": 0.6824, + "mean_token_accuracy": 0.7955764472484589, + "num_tokens": 177313945.0, + "step": 75320 + }, + { + "epoch": 0.6906573759970661, + "learning_rate": 6.187035848537637e-05, + "loss": 0.6987, + "mean_token_accuracy": 0.7869789004325867, + "num_tokens": 177339227.0, + "step": 75330 + }, + { + "epoch": 0.6907490602365454, + "learning_rate": 6.185202163748052e-05, + "loss": 0.6667, + "mean_token_accuracy": 0.7907529294490814, + "num_tokens": 177363411.0, + "step": 75340 + }, + { + "epoch": 0.6908407444760246, + "learning_rate": 6.183368478958467e-05, + "loss": 0.6942, + "mean_token_accuracy": 0.7806631922721863, + "num_tokens": 177387858.0, + "step": 75350 + }, + { + "epoch": 0.6909324287155038, + "learning_rate": 6.181534794168882e-05, + "loss": 0.6747, + "mean_token_accuracy": 0.792816162109375, + "num_tokens": 177414118.0, + "step": 75360 + }, + { + "epoch": 0.691024112954983, + "learning_rate": 6.179701109379298e-05, + "loss": 0.6949, + "mean_token_accuracy": 0.7874690413475036, + "num_tokens": 177438751.0, + "step": 75370 + }, + { + "epoch": 0.6911157971944623, + "learning_rate": 6.177867424589713e-05, + "loss": 0.6898, + "mean_token_accuracy": 0.7809600532054901, + "num_tokens": 177463691.0, + "step": 75380 + }, + { + "epoch": 0.6912074814339415, + "learning_rate": 6.17603373980013e-05, + "loss": 0.6795, + "mean_token_accuracy": 0.7870772123336792, + "num_tokens": 177488303.0, + "step": 75390 + }, + { + "epoch": 0.6912991656734208, + "learning_rate": 6.174200055010545e-05, + "loss": 0.6601, + "mean_token_accuracy": 0.7902093172073364, + "num_tokens": 177513019.0, + "step": 75400 + }, + { + "epoch": 0.6913908499129, + "learning_rate": 6.172366370220958e-05, + "loss": 0.6664, + "mean_token_accuracy": 0.7936054110527039, + "num_tokens": 177537750.0, + "step": 75410 + }, + { + "epoch": 0.6914825341523793, + "learning_rate": 6.170532685431375e-05, + "loss": 0.6764, + "mean_token_accuracy": 0.7926254570484161, + "num_tokens": 177563617.0, + "step": 75420 + }, + { + "epoch": 0.6915742183918584, + "learning_rate": 6.16869900064179e-05, + "loss": 0.6905, + "mean_token_accuracy": 0.7925673961639405, + "num_tokens": 177590017.0, + "step": 75430 + }, + { + "epoch": 0.6916659026313376, + "learning_rate": 6.166865315852205e-05, + "loss": 0.6711, + "mean_token_accuracy": 0.7915888249874115, + "num_tokens": 177615609.0, + "step": 75440 + }, + { + "epoch": 0.6917575868708169, + "learning_rate": 6.16503163106262e-05, + "loss": 0.6932, + "mean_token_accuracy": 0.7848492503166199, + "num_tokens": 177641094.0, + "step": 75450 + }, + { + "epoch": 0.6918492711102961, + "learning_rate": 6.163197946273036e-05, + "loss": 0.691, + "mean_token_accuracy": 0.7870258510112762, + "num_tokens": 177665845.0, + "step": 75460 + }, + { + "epoch": 0.6919409553497754, + "learning_rate": 6.161364261483451e-05, + "loss": 0.6693, + "mean_token_accuracy": 0.7906091928482055, + "num_tokens": 177691782.0, + "step": 75470 + }, + { + "epoch": 0.6920326395892547, + "learning_rate": 6.159530576693867e-05, + "loss": 0.6525, + "mean_token_accuracy": 0.7949664413928985, + "num_tokens": 177716605.0, + "step": 75480 + }, + { + "epoch": 0.6921243238287338, + "learning_rate": 6.157696891904283e-05, + "loss": 0.676, + "mean_token_accuracy": 0.7979806184768676, + "num_tokens": 177741785.0, + "step": 75490 + }, + { + "epoch": 0.692216008068213, + "learning_rate": 6.155863207114698e-05, + "loss": 0.6735, + "mean_token_accuracy": 0.7911450088024139, + "num_tokens": 177767958.0, + "step": 75500 + }, + { + "epoch": 0.6923076923076923, + "learning_rate": 6.154029522325112e-05, + "loss": 0.6486, + "mean_token_accuracy": 0.8005157113075256, + "num_tokens": 177792220.0, + "step": 75510 + }, + { + "epoch": 0.6923993765471715, + "learning_rate": 6.152195837535528e-05, + "loss": 0.6788, + "mean_token_accuracy": 0.7899494409561157, + "num_tokens": 177817232.0, + "step": 75520 + }, + { + "epoch": 0.6924910607866508, + "learning_rate": 6.150362152745943e-05, + "loss": 0.6877, + "mean_token_accuracy": 0.7852452516555786, + "num_tokens": 177842140.0, + "step": 75530 + }, + { + "epoch": 0.69258274502613, + "learning_rate": 6.148528467956359e-05, + "loss": 0.6645, + "mean_token_accuracy": 0.7939651489257813, + "num_tokens": 177867930.0, + "step": 75540 + }, + { + "epoch": 0.6926744292656093, + "learning_rate": 6.146694783166774e-05, + "loss": 0.7164, + "mean_token_accuracy": 0.7811005592346192, + "num_tokens": 177892720.0, + "step": 75550 + }, + { + "epoch": 0.6927661135050884, + "learning_rate": 6.144861098377189e-05, + "loss": 0.7102, + "mean_token_accuracy": 0.7842880129814148, + "num_tokens": 177917877.0, + "step": 75560 + }, + { + "epoch": 0.6928577977445677, + "learning_rate": 6.143027413587604e-05, + "loss": 0.6923, + "mean_token_accuracy": 0.782748019695282, + "num_tokens": 177943076.0, + "step": 75570 + }, + { + "epoch": 0.6929494819840469, + "learning_rate": 6.14119372879802e-05, + "loss": 0.6618, + "mean_token_accuracy": 0.7946770131587982, + "num_tokens": 177968703.0, + "step": 75580 + }, + { + "epoch": 0.6930411662235262, + "learning_rate": 6.139360044008436e-05, + "loss": 0.6828, + "mean_token_accuracy": 0.7888063311576843, + "num_tokens": 177993985.0, + "step": 75590 + }, + { + "epoch": 0.6931328504630054, + "learning_rate": 6.137526359218851e-05, + "loss": 0.6891, + "mean_token_accuracy": 0.779136347770691, + "num_tokens": 178018934.0, + "step": 75600 + }, + { + "epoch": 0.6932245347024847, + "learning_rate": 6.135692674429266e-05, + "loss": 0.6589, + "mean_token_accuracy": 0.7927046358585358, + "num_tokens": 178044845.0, + "step": 75610 + }, + { + "epoch": 0.6933162189419638, + "learning_rate": 6.133858989639681e-05, + "loss": 0.6808, + "mean_token_accuracy": 0.788493013381958, + "num_tokens": 178070021.0, + "step": 75620 + }, + { + "epoch": 0.6934079031814431, + "learning_rate": 6.132025304850097e-05, + "loss": 0.722, + "mean_token_accuracy": 0.7846109211444855, + "num_tokens": 178095090.0, + "step": 75630 + }, + { + "epoch": 0.6934995874209223, + "learning_rate": 6.130191620060512e-05, + "loss": 0.6734, + "mean_token_accuracy": 0.7920516550540924, + "num_tokens": 178120327.0, + "step": 75640 + }, + { + "epoch": 0.6935912716604016, + "learning_rate": 6.128357935270927e-05, + "loss": 0.6597, + "mean_token_accuracy": 0.7969824314117432, + "num_tokens": 178145092.0, + "step": 75650 + }, + { + "epoch": 0.6936829558998808, + "learning_rate": 6.126524250481342e-05, + "loss": 0.7192, + "mean_token_accuracy": 0.7807035684585572, + "num_tokens": 178169803.0, + "step": 75660 + }, + { + "epoch": 0.6937746401393601, + "learning_rate": 6.124690565691757e-05, + "loss": 0.6721, + "mean_token_accuracy": 0.7994394123554229, + "num_tokens": 178195806.0, + "step": 75670 + }, + { + "epoch": 0.6938663243788393, + "learning_rate": 6.122856880902174e-05, + "loss": 0.7059, + "mean_token_accuracy": 0.7798124194145203, + "num_tokens": 178220866.0, + "step": 75680 + }, + { + "epoch": 0.6939580086183185, + "learning_rate": 6.121023196112589e-05, + "loss": 0.6599, + "mean_token_accuracy": 0.7958055436611176, + "num_tokens": 178245969.0, + "step": 75690 + }, + { + "epoch": 0.6940496928577977, + "learning_rate": 6.119189511323004e-05, + "loss": 0.6593, + "mean_token_accuracy": 0.7950552761554718, + "num_tokens": 178271298.0, + "step": 75700 + }, + { + "epoch": 0.694141377097277, + "learning_rate": 6.11735582653342e-05, + "loss": 0.6692, + "mean_token_accuracy": 0.7914415419101715, + "num_tokens": 178296247.0, + "step": 75710 + }, + { + "epoch": 0.6942330613367562, + "learning_rate": 6.115522141743835e-05, + "loss": 0.6735, + "mean_token_accuracy": 0.7871362745761872, + "num_tokens": 178321619.0, + "step": 75720 + }, + { + "epoch": 0.6943247455762355, + "learning_rate": 6.11368845695425e-05, + "loss": 0.7062, + "mean_token_accuracy": 0.7866231739521027, + "num_tokens": 178346554.0, + "step": 75730 + }, + { + "epoch": 0.6944164298157147, + "learning_rate": 6.111854772164666e-05, + "loss": 0.6786, + "mean_token_accuracy": 0.7940635979175568, + "num_tokens": 178371551.0, + "step": 75740 + }, + { + "epoch": 0.6945081140551939, + "learning_rate": 6.11002108737508e-05, + "loss": 0.6367, + "mean_token_accuracy": 0.8015643656253815, + "num_tokens": 178396997.0, + "step": 75750 + }, + { + "epoch": 0.6945997982946731, + "learning_rate": 6.108187402585495e-05, + "loss": 0.6738, + "mean_token_accuracy": 0.7952834844589234, + "num_tokens": 178421864.0, + "step": 75760 + }, + { + "epoch": 0.6946914825341524, + "learning_rate": 6.10635371779591e-05, + "loss": 0.6645, + "mean_token_accuracy": 0.7930844902992249, + "num_tokens": 178447351.0, + "step": 75770 + }, + { + "epoch": 0.6947831667736316, + "learning_rate": 6.104520033006327e-05, + "loss": 0.7042, + "mean_token_accuracy": 0.7845900595188141, + "num_tokens": 178472558.0, + "step": 75780 + }, + { + "epoch": 0.6948748510131109, + "learning_rate": 6.1026863482167416e-05, + "loss": 0.6677, + "mean_token_accuracy": 0.7874324023723602, + "num_tokens": 178497672.0, + "step": 75790 + }, + { + "epoch": 0.6949665352525901, + "learning_rate": 6.100852663427157e-05, + "loss": 0.7032, + "mean_token_accuracy": 0.7855457067489624, + "num_tokens": 178521761.0, + "step": 75800 + }, + { + "epoch": 0.6950582194920694, + "learning_rate": 6.0990189786375726e-05, + "loss": 0.7079, + "mean_token_accuracy": 0.7808915078639984, + "num_tokens": 178546512.0, + "step": 75810 + }, + { + "epoch": 0.6951499037315485, + "learning_rate": 6.097185293847988e-05, + "loss": 0.6691, + "mean_token_accuracy": 0.7944140315055848, + "num_tokens": 178572627.0, + "step": 75820 + }, + { + "epoch": 0.6952415879710278, + "learning_rate": 6.095351609058403e-05, + "loss": 0.706, + "mean_token_accuracy": 0.7832296431064606, + "num_tokens": 178598214.0, + "step": 75830 + }, + { + "epoch": 0.695333272210507, + "learning_rate": 6.093517924268819e-05, + "loss": 0.7282, + "mean_token_accuracy": 0.7790860772132874, + "num_tokens": 178623376.0, + "step": 75840 + }, + { + "epoch": 0.6954249564499863, + "learning_rate": 6.091684239479234e-05, + "loss": 0.6928, + "mean_token_accuracy": 0.7807729482650757, + "num_tokens": 178648911.0, + "step": 75850 + }, + { + "epoch": 0.6955166406894655, + "learning_rate": 6.089850554689649e-05, + "loss": 0.7165, + "mean_token_accuracy": 0.7829519927501678, + "num_tokens": 178674426.0, + "step": 75860 + }, + { + "epoch": 0.6956083249289448, + "learning_rate": 6.088016869900064e-05, + "loss": 0.6753, + "mean_token_accuracy": 0.7965818285942078, + "num_tokens": 178699367.0, + "step": 75870 + }, + { + "epoch": 0.6957000091684239, + "learning_rate": 6.08618318511048e-05, + "loss": 0.6931, + "mean_token_accuracy": 0.7931291162967682, + "num_tokens": 178723765.0, + "step": 75880 + }, + { + "epoch": 0.6957916934079031, + "learning_rate": 6.084349500320895e-05, + "loss": 0.682, + "mean_token_accuracy": 0.7902142465114593, + "num_tokens": 178748686.0, + "step": 75890 + }, + { + "epoch": 0.6958833776473824, + "learning_rate": 6.08251581553131e-05, + "loss": 0.6778, + "mean_token_accuracy": 0.7876346409320831, + "num_tokens": 178772815.0, + "step": 75900 + }, + { + "epoch": 0.6959750618868616, + "learning_rate": 6.080682130741726e-05, + "loss": 0.6933, + "mean_token_accuracy": 0.787034273147583, + "num_tokens": 178797692.0, + "step": 75910 + }, + { + "epoch": 0.6960667461263409, + "learning_rate": 6.078848445952141e-05, + "loss": 0.6792, + "mean_token_accuracy": 0.7882838785648346, + "num_tokens": 178823018.0, + "step": 75920 + }, + { + "epoch": 0.6961584303658201, + "learning_rate": 6.077014761162556e-05, + "loss": 0.6752, + "mean_token_accuracy": 0.7874985039234161, + "num_tokens": 178848157.0, + "step": 75930 + }, + { + "epoch": 0.6962501146052994, + "learning_rate": 6.075181076372972e-05, + "loss": 0.6875, + "mean_token_accuracy": 0.7919121146202087, + "num_tokens": 178873190.0, + "step": 75940 + }, + { + "epoch": 0.6963417988447785, + "learning_rate": 6.073347391583387e-05, + "loss": 0.6829, + "mean_token_accuracy": 0.792927211523056, + "num_tokens": 178899419.0, + "step": 75950 + }, + { + "epoch": 0.6964334830842578, + "learning_rate": 6.0715137067938024e-05, + "loss": 0.6725, + "mean_token_accuracy": 0.7921659231185914, + "num_tokens": 178924798.0, + "step": 75960 + }, + { + "epoch": 0.696525167323737, + "learning_rate": 6.069680022004218e-05, + "loss": 0.6586, + "mean_token_accuracy": 0.7956588447093964, + "num_tokens": 178950818.0, + "step": 75970 + }, + { + "epoch": 0.6966168515632163, + "learning_rate": 6.0678463372146335e-05, + "loss": 0.6736, + "mean_token_accuracy": 0.7838387608528137, + "num_tokens": 178976757.0, + "step": 75980 + }, + { + "epoch": 0.6967085358026955, + "learning_rate": 6.066012652425048e-05, + "loss": 0.7003, + "mean_token_accuracy": 0.7866319477558136, + "num_tokens": 179001693.0, + "step": 75990 + }, + { + "epoch": 0.6968002200421748, + "learning_rate": 6.064178967635463e-05, + "loss": 0.6691, + "mean_token_accuracy": 0.7886835098266601, + "num_tokens": 179026674.0, + "step": 76000 + }, + { + "epoch": 0.6968919042816539, + "learning_rate": 6.062345282845879e-05, + "loss": 0.6592, + "mean_token_accuracy": 0.7934810280799866, + "num_tokens": 179051807.0, + "step": 76010 + }, + { + "epoch": 0.6969835885211332, + "learning_rate": 6.060511598056294e-05, + "loss": 0.6687, + "mean_token_accuracy": 0.7910148620605468, + "num_tokens": 179077149.0, + "step": 76020 + }, + { + "epoch": 0.6970752727606124, + "learning_rate": 6.0586779132667094e-05, + "loss": 0.6614, + "mean_token_accuracy": 0.7928116798400879, + "num_tokens": 179102955.0, + "step": 76030 + }, + { + "epoch": 0.6971669570000917, + "learning_rate": 6.056844228477125e-05, + "loss": 0.6844, + "mean_token_accuracy": 0.7920890152454376, + "num_tokens": 179128374.0, + "step": 76040 + }, + { + "epoch": 0.6972586412395709, + "learning_rate": 6.0550105436875405e-05, + "loss": 0.6918, + "mean_token_accuracy": 0.7865221977233887, + "num_tokens": 179153390.0, + "step": 76050 + }, + { + "epoch": 0.6973503254790502, + "learning_rate": 6.053176858897956e-05, + "loss": 0.6735, + "mean_token_accuracy": 0.7937344133853912, + "num_tokens": 179178350.0, + "step": 76060 + }, + { + "epoch": 0.6974420097185294, + "learning_rate": 6.0513431741083715e-05, + "loss": 0.664, + "mean_token_accuracy": 0.7925346910953521, + "num_tokens": 179202990.0, + "step": 76070 + }, + { + "epoch": 0.6975336939580086, + "learning_rate": 6.049509489318787e-05, + "loss": 0.681, + "mean_token_accuracy": 0.7910955011844635, + "num_tokens": 179228708.0, + "step": 76080 + }, + { + "epoch": 0.6976253781974878, + "learning_rate": 6.047675804529201e-05, + "loss": 0.7205, + "mean_token_accuracy": 0.7769014358520507, + "num_tokens": 179254154.0, + "step": 76090 + }, + { + "epoch": 0.6977170624369671, + "learning_rate": 6.045842119739618e-05, + "loss": 0.6712, + "mean_token_accuracy": 0.7906412899494171, + "num_tokens": 179279894.0, + "step": 76100 + }, + { + "epoch": 0.6978087466764463, + "learning_rate": 6.044008434950032e-05, + "loss": 0.6632, + "mean_token_accuracy": 0.7903281688690186, + "num_tokens": 179304958.0, + "step": 76110 + }, + { + "epoch": 0.6979004309159256, + "learning_rate": 6.0421747501604475e-05, + "loss": 0.6502, + "mean_token_accuracy": 0.7969510674476623, + "num_tokens": 179329896.0, + "step": 76120 + }, + { + "epoch": 0.6979921151554048, + "learning_rate": 6.0403410653708627e-05, + "loss": 0.6948, + "mean_token_accuracy": 0.7847719728946686, + "num_tokens": 179354591.0, + "step": 76130 + }, + { + "epoch": 0.6980837993948841, + "learning_rate": 6.0385073805812785e-05, + "loss": 0.7005, + "mean_token_accuracy": 0.7879184305667877, + "num_tokens": 179380583.0, + "step": 76140 + }, + { + "epoch": 0.6981754836343632, + "learning_rate": 6.036673695791694e-05, + "loss": 0.6927, + "mean_token_accuracy": 0.7896237909793854, + "num_tokens": 179405606.0, + "step": 76150 + }, + { + "epoch": 0.6982671678738425, + "learning_rate": 6.034840011002109e-05, + "loss": 0.6773, + "mean_token_accuracy": 0.7949445068836212, + "num_tokens": 179431105.0, + "step": 76160 + }, + { + "epoch": 0.6983588521133217, + "learning_rate": 6.033006326212525e-05, + "loss": 0.67, + "mean_token_accuracy": 0.7901997804641724, + "num_tokens": 179456593.0, + "step": 76170 + }, + { + "epoch": 0.698450536352801, + "learning_rate": 6.03117264142294e-05, + "loss": 0.6815, + "mean_token_accuracy": 0.7900418698787689, + "num_tokens": 179481639.0, + "step": 76180 + }, + { + "epoch": 0.6985422205922802, + "learning_rate": 6.0293389566333545e-05, + "loss": 0.6631, + "mean_token_accuracy": 0.7938229978084564, + "num_tokens": 179507111.0, + "step": 76190 + }, + { + "epoch": 0.6986339048317595, + "learning_rate": 6.027505271843771e-05, + "loss": 0.6655, + "mean_token_accuracy": 0.791388314962387, + "num_tokens": 179532400.0, + "step": 76200 + }, + { + "epoch": 0.6987255890712386, + "learning_rate": 6.0256715870541855e-05, + "loss": 0.6608, + "mean_token_accuracy": 0.7964693009853363, + "num_tokens": 179557888.0, + "step": 76210 + }, + { + "epoch": 0.6988172733107179, + "learning_rate": 6.023837902264601e-05, + "loss": 0.6949, + "mean_token_accuracy": 0.7877890586853027, + "num_tokens": 179583210.0, + "step": 76220 + }, + { + "epoch": 0.6989089575501971, + "learning_rate": 6.0220042174750166e-05, + "loss": 0.706, + "mean_token_accuracy": 0.7825822949409484, + "num_tokens": 179609231.0, + "step": 76230 + }, + { + "epoch": 0.6990006417896764, + "learning_rate": 6.020170532685432e-05, + "loss": 0.6495, + "mean_token_accuracy": 0.8009159028530121, + "num_tokens": 179634299.0, + "step": 76240 + }, + { + "epoch": 0.6990923260291556, + "learning_rate": 6.018336847895847e-05, + "loss": 0.6879, + "mean_token_accuracy": 0.7836112380027771, + "num_tokens": 179659224.0, + "step": 76250 + }, + { + "epoch": 0.6991840102686349, + "learning_rate": 6.016503163106262e-05, + "loss": 0.7075, + "mean_token_accuracy": 0.7844682037830353, + "num_tokens": 179684487.0, + "step": 76260 + }, + { + "epoch": 0.6992756945081141, + "learning_rate": 6.014669478316678e-05, + "loss": 0.7047, + "mean_token_accuracy": 0.7841387391090393, + "num_tokens": 179709986.0, + "step": 76270 + }, + { + "epoch": 0.6993673787475932, + "learning_rate": 6.012835793527093e-05, + "loss": 0.6919, + "mean_token_accuracy": 0.7843936502933502, + "num_tokens": 179735307.0, + "step": 76280 + }, + { + "epoch": 0.6994590629870725, + "learning_rate": 6.011002108737508e-05, + "loss": 0.6909, + "mean_token_accuracy": 0.7878920257091522, + "num_tokens": 179761106.0, + "step": 76290 + }, + { + "epoch": 0.6995507472265518, + "learning_rate": 6.009168423947924e-05, + "loss": 0.6882, + "mean_token_accuracy": 0.7916716039180756, + "num_tokens": 179786240.0, + "step": 76300 + }, + { + "epoch": 0.699642431466031, + "learning_rate": 6.007334739158339e-05, + "loss": 0.6609, + "mean_token_accuracy": 0.7954664885997772, + "num_tokens": 179811970.0, + "step": 76310 + }, + { + "epoch": 0.6997341157055103, + "learning_rate": 6.005501054368754e-05, + "loss": 0.7142, + "mean_token_accuracy": 0.7827772855758667, + "num_tokens": 179836667.0, + "step": 76320 + }, + { + "epoch": 0.6998257999449895, + "learning_rate": 6.00366736957917e-05, + "loss": 0.6555, + "mean_token_accuracy": 0.7956376850605011, + "num_tokens": 179861968.0, + "step": 76330 + }, + { + "epoch": 0.6999174841844686, + "learning_rate": 6.001833684789585e-05, + "loss": 0.6638, + "mean_token_accuracy": 0.7971653342247009, + "num_tokens": 179887636.0, + "step": 76340 + }, + { + "epoch": 0.7000091684239479, + "learning_rate": 6e-05, + "loss": 0.688, + "mean_token_accuracy": 0.785324776172638, + "num_tokens": 179912698.0, + "step": 76350 + }, + { + "epoch": 0.7001008526634271, + "learning_rate": 5.998166315210416e-05, + "loss": 0.6523, + "mean_token_accuracy": 0.7965922951698303, + "num_tokens": 179938140.0, + "step": 76360 + }, + { + "epoch": 0.7001925369029064, + "learning_rate": 5.996332630420831e-05, + "loss": 0.6551, + "mean_token_accuracy": 0.7932762920856475, + "num_tokens": 179963079.0, + "step": 76370 + }, + { + "epoch": 0.7002842211423856, + "learning_rate": 5.9944989456312464e-05, + "loss": 0.6949, + "mean_token_accuracy": 0.7842654764652253, + "num_tokens": 179988743.0, + "step": 76380 + }, + { + "epoch": 0.7003759053818649, + "learning_rate": 5.992665260841661e-05, + "loss": 0.6589, + "mean_token_accuracy": 0.7966576039791107, + "num_tokens": 180014016.0, + "step": 76390 + }, + { + "epoch": 0.7004675896213441, + "learning_rate": 5.9908315760520774e-05, + "loss": 0.6792, + "mean_token_accuracy": 0.7953386723995208, + "num_tokens": 180039818.0, + "step": 76400 + }, + { + "epoch": 0.7005592738608233, + "learning_rate": 5.988997891262492e-05, + "loss": 0.6695, + "mean_token_accuracy": 0.79258491396904, + "num_tokens": 180065228.0, + "step": 76410 + }, + { + "epoch": 0.7006509581003025, + "learning_rate": 5.987164206472907e-05, + "loss": 0.6875, + "mean_token_accuracy": 0.7920036256313324, + "num_tokens": 180090602.0, + "step": 76420 + }, + { + "epoch": 0.7007426423397818, + "learning_rate": 5.985330521683323e-05, + "loss": 0.6319, + "mean_token_accuracy": 0.8041131377220154, + "num_tokens": 180115623.0, + "step": 76430 + }, + { + "epoch": 0.700834326579261, + "learning_rate": 5.983496836893738e-05, + "loss": 0.6781, + "mean_token_accuracy": 0.7869494497776032, + "num_tokens": 180140359.0, + "step": 76440 + }, + { + "epoch": 0.7009260108187403, + "learning_rate": 5.9816631521041534e-05, + "loss": 0.6824, + "mean_token_accuracy": 0.7869329512119293, + "num_tokens": 180164972.0, + "step": 76450 + }, + { + "epoch": 0.7010176950582195, + "learning_rate": 5.979829467314569e-05, + "loss": 0.6601, + "mean_token_accuracy": 0.796118974685669, + "num_tokens": 180189791.0, + "step": 76460 + }, + { + "epoch": 0.7011093792976987, + "learning_rate": 5.9779957825249844e-05, + "loss": 0.6826, + "mean_token_accuracy": 0.7869082808494567, + "num_tokens": 180215349.0, + "step": 76470 + }, + { + "epoch": 0.7012010635371779, + "learning_rate": 5.9761620977353996e-05, + "loss": 0.6826, + "mean_token_accuracy": 0.7972529768943787, + "num_tokens": 180240882.0, + "step": 76480 + }, + { + "epoch": 0.7012927477766572, + "learning_rate": 5.974328412945814e-05, + "loss": 0.6973, + "mean_token_accuracy": 0.7850015044212342, + "num_tokens": 180266371.0, + "step": 76490 + }, + { + "epoch": 0.7013844320161364, + "learning_rate": 5.972494728156231e-05, + "loss": 0.657, + "mean_token_accuracy": 0.7914840102195739, + "num_tokens": 180291410.0, + "step": 76500 + }, + { + "epoch": 0.7014761162556157, + "learning_rate": 5.970661043366645e-05, + "loss": 0.6154, + "mean_token_accuracy": 0.8100368440151214, + "num_tokens": 180317090.0, + "step": 76510 + }, + { + "epoch": 0.7015678004950949, + "learning_rate": 5.9688273585770604e-05, + "loss": 0.6448, + "mean_token_accuracy": 0.8013284623622894, + "num_tokens": 180342333.0, + "step": 76520 + }, + { + "epoch": 0.7016594847345742, + "learning_rate": 5.966993673787476e-05, + "loss": 0.6946, + "mean_token_accuracy": 0.7870315790176392, + "num_tokens": 180367314.0, + "step": 76530 + }, + { + "epoch": 0.7017511689740533, + "learning_rate": 5.9651599889978914e-05, + "loss": 0.6896, + "mean_token_accuracy": 0.7894434034824371, + "num_tokens": 180392770.0, + "step": 76540 + }, + { + "epoch": 0.7018428532135326, + "learning_rate": 5.9633263042083066e-05, + "loss": 0.6748, + "mean_token_accuracy": 0.7907483339309692, + "num_tokens": 180418879.0, + "step": 76550 + }, + { + "epoch": 0.7019345374530118, + "learning_rate": 5.9614926194187225e-05, + "loss": 0.6828, + "mean_token_accuracy": 0.7872988939285278, + "num_tokens": 180444107.0, + "step": 76560 + }, + { + "epoch": 0.7020262216924911, + "learning_rate": 5.9596589346291376e-05, + "loss": 0.684, + "mean_token_accuracy": 0.791980254650116, + "num_tokens": 180469720.0, + "step": 76570 + }, + { + "epoch": 0.7021179059319703, + "learning_rate": 5.957825249839553e-05, + "loss": 0.6655, + "mean_token_accuracy": 0.7936712384223938, + "num_tokens": 180495426.0, + "step": 76580 + }, + { + "epoch": 0.7022095901714496, + "learning_rate": 5.955991565049969e-05, + "loss": 0.6735, + "mean_token_accuracy": 0.794761061668396, + "num_tokens": 180520531.0, + "step": 76590 + }, + { + "epoch": 0.7023012744109287, + "learning_rate": 5.954157880260384e-05, + "loss": 0.6687, + "mean_token_accuracy": 0.7890596449375152, + "num_tokens": 180545814.0, + "step": 76600 + }, + { + "epoch": 0.702392958650408, + "learning_rate": 5.9523241954707984e-05, + "loss": 0.6626, + "mean_token_accuracy": 0.7914606809616089, + "num_tokens": 180570631.0, + "step": 76610 + }, + { + "epoch": 0.7024846428898872, + "learning_rate": 5.9504905106812136e-05, + "loss": 0.6723, + "mean_token_accuracy": 0.7984126508235931, + "num_tokens": 180596049.0, + "step": 76620 + }, + { + "epoch": 0.7025763271293665, + "learning_rate": 5.9486568258916294e-05, + "loss": 0.6636, + "mean_token_accuracy": 0.7984091997146606, + "num_tokens": 180622258.0, + "step": 76630 + }, + { + "epoch": 0.7026680113688457, + "learning_rate": 5.9468231411020446e-05, + "loss": 0.6718, + "mean_token_accuracy": 0.7853006243705749, + "num_tokens": 180646728.0, + "step": 76640 + }, + { + "epoch": 0.702759695608325, + "learning_rate": 5.94498945631246e-05, + "loss": 0.6951, + "mean_token_accuracy": 0.7850263833999633, + "num_tokens": 180671574.0, + "step": 76650 + }, + { + "epoch": 0.7028513798478042, + "learning_rate": 5.943155771522876e-05, + "loss": 0.6799, + "mean_token_accuracy": 0.7914558529853821, + "num_tokens": 180696395.0, + "step": 76660 + }, + { + "epoch": 0.7029430640872834, + "learning_rate": 5.941322086733291e-05, + "loss": 0.7179, + "mean_token_accuracy": 0.781195193529129, + "num_tokens": 180721002.0, + "step": 76670 + }, + { + "epoch": 0.7030347483267626, + "learning_rate": 5.939488401943706e-05, + "loss": 0.6632, + "mean_token_accuracy": 0.7917946457862854, + "num_tokens": 180746339.0, + "step": 76680 + }, + { + "epoch": 0.7031264325662419, + "learning_rate": 5.937654717154122e-05, + "loss": 0.6678, + "mean_token_accuracy": 0.792183643579483, + "num_tokens": 180770717.0, + "step": 76690 + }, + { + "epoch": 0.7032181168057211, + "learning_rate": 5.935821032364537e-05, + "loss": 0.7112, + "mean_token_accuracy": 0.784171599149704, + "num_tokens": 180795691.0, + "step": 76700 + }, + { + "epoch": 0.7033098010452004, + "learning_rate": 5.9339873475749516e-05, + "loss": 0.6619, + "mean_token_accuracy": 0.7923989355564117, + "num_tokens": 180821094.0, + "step": 76710 + }, + { + "epoch": 0.7034014852846796, + "learning_rate": 5.932153662785368e-05, + "loss": 0.6319, + "mean_token_accuracy": 0.8048372387886047, + "num_tokens": 180846700.0, + "step": 76720 + }, + { + "epoch": 0.7034931695241587, + "learning_rate": 5.930319977995783e-05, + "loss": 0.6769, + "mean_token_accuracy": 0.7893557667732238, + "num_tokens": 180872282.0, + "step": 76730 + }, + { + "epoch": 0.703584853763638, + "learning_rate": 5.928486293206198e-05, + "loss": 0.7249, + "mean_token_accuracy": 0.7826806366443634, + "num_tokens": 180897235.0, + "step": 76740 + }, + { + "epoch": 0.7036765380031172, + "learning_rate": 5.926652608416613e-05, + "loss": 0.6778, + "mean_token_accuracy": 0.7904228389263153, + "num_tokens": 180922529.0, + "step": 76750 + }, + { + "epoch": 0.7037682222425965, + "learning_rate": 5.924818923627029e-05, + "loss": 0.6492, + "mean_token_accuracy": 0.7943959832191467, + "num_tokens": 180948432.0, + "step": 76760 + }, + { + "epoch": 0.7038599064820757, + "learning_rate": 5.922985238837444e-05, + "loss": 0.6322, + "mean_token_accuracy": 0.7964687287807465, + "num_tokens": 180973094.0, + "step": 76770 + }, + { + "epoch": 0.703951590721555, + "learning_rate": 5.921151554047859e-05, + "loss": 0.6803, + "mean_token_accuracy": 0.7894576191902161, + "num_tokens": 180997814.0, + "step": 76780 + }, + { + "epoch": 0.7040432749610342, + "learning_rate": 5.919317869258275e-05, + "loss": 0.6803, + "mean_token_accuracy": 0.7830595135688782, + "num_tokens": 181021971.0, + "step": 76790 + }, + { + "epoch": 0.7041349592005134, + "learning_rate": 5.91748418446869e-05, + "loss": 0.6886, + "mean_token_accuracy": 0.7863920331001282, + "num_tokens": 181047177.0, + "step": 76800 + }, + { + "epoch": 0.7042266434399926, + "learning_rate": 5.915650499679105e-05, + "loss": 0.6879, + "mean_token_accuracy": 0.7897522926330567, + "num_tokens": 181072613.0, + "step": 76810 + }, + { + "epoch": 0.7043183276794719, + "learning_rate": 5.9138168148895214e-05, + "loss": 0.7155, + "mean_token_accuracy": 0.7848186373710633, + "num_tokens": 181098545.0, + "step": 76820 + }, + { + "epoch": 0.7044100119189511, + "learning_rate": 5.911983130099936e-05, + "loss": 0.6931, + "mean_token_accuracy": 0.7870139658451081, + "num_tokens": 181123650.0, + "step": 76830 + }, + { + "epoch": 0.7045016961584304, + "learning_rate": 5.910149445310351e-05, + "loss": 0.679, + "mean_token_accuracy": 0.7967150986194611, + "num_tokens": 181148046.0, + "step": 76840 + }, + { + "epoch": 0.7045933803979096, + "learning_rate": 5.9083157605207676e-05, + "loss": 0.6688, + "mean_token_accuracy": 0.793145477771759, + "num_tokens": 181173276.0, + "step": 76850 + }, + { + "epoch": 0.7046850646373888, + "learning_rate": 5.906482075731182e-05, + "loss": 0.6847, + "mean_token_accuracy": 0.7901999592781067, + "num_tokens": 181198838.0, + "step": 76860 + }, + { + "epoch": 0.704776748876868, + "learning_rate": 5.904648390941597e-05, + "loss": 0.6761, + "mean_token_accuracy": 0.7846197009086608, + "num_tokens": 181224476.0, + "step": 76870 + }, + { + "epoch": 0.7048684331163473, + "learning_rate": 5.9028147061520125e-05, + "loss": 0.6622, + "mean_token_accuracy": 0.7943405210971832, + "num_tokens": 181248987.0, + "step": 76880 + }, + { + "epoch": 0.7049601173558265, + "learning_rate": 5.9009810213624284e-05, + "loss": 0.7147, + "mean_token_accuracy": 0.7793645620346069, + "num_tokens": 181274286.0, + "step": 76890 + }, + { + "epoch": 0.7050518015953058, + "learning_rate": 5.8991473365728436e-05, + "loss": 0.6614, + "mean_token_accuracy": 0.7946879148483277, + "num_tokens": 181299549.0, + "step": 76900 + }, + { + "epoch": 0.705143485834785, + "learning_rate": 5.897313651783258e-05, + "loss": 0.7211, + "mean_token_accuracy": 0.7797550737857819, + "num_tokens": 181324757.0, + "step": 76910 + }, + { + "epoch": 0.7052351700742643, + "learning_rate": 5.8954799669936746e-05, + "loss": 0.6767, + "mean_token_accuracy": 0.7889573633670807, + "num_tokens": 181349457.0, + "step": 76920 + }, + { + "epoch": 0.7053268543137434, + "learning_rate": 5.893646282204089e-05, + "loss": 0.6817, + "mean_token_accuracy": 0.7939691424369812, + "num_tokens": 181374695.0, + "step": 76930 + }, + { + "epoch": 0.7054185385532227, + "learning_rate": 5.891812597414504e-05, + "loss": 0.6669, + "mean_token_accuracy": 0.7937139928340912, + "num_tokens": 181400364.0, + "step": 76940 + }, + { + "epoch": 0.7055102227927019, + "learning_rate": 5.889978912624921e-05, + "loss": 0.6947, + "mean_token_accuracy": 0.7926955759525299, + "num_tokens": 181425822.0, + "step": 76950 + }, + { + "epoch": 0.7056019070321812, + "learning_rate": 5.8881452278353354e-05, + "loss": 0.6693, + "mean_token_accuracy": 0.7917500972747803, + "num_tokens": 181451487.0, + "step": 76960 + }, + { + "epoch": 0.7056935912716604, + "learning_rate": 5.8863115430457505e-05, + "loss": 0.7228, + "mean_token_accuracy": 0.7817276835441589, + "num_tokens": 181477328.0, + "step": 76970 + }, + { + "epoch": 0.7057852755111397, + "learning_rate": 5.8844778582561664e-05, + "loss": 0.6799, + "mean_token_accuracy": 0.7889807641506195, + "num_tokens": 181502502.0, + "step": 76980 + }, + { + "epoch": 0.7058769597506188, + "learning_rate": 5.8826441734665816e-05, + "loss": 0.6712, + "mean_token_accuracy": 0.7955949425697326, + "num_tokens": 181528497.0, + "step": 76990 + }, + { + "epoch": 0.7059686439900981, + "learning_rate": 5.880810488676997e-05, + "loss": 0.6782, + "mean_token_accuracy": 0.7896027624607086, + "num_tokens": 181552879.0, + "step": 77000 + }, + { + "epoch": 0.7060603282295773, + "learning_rate": 5.878976803887411e-05, + "loss": 0.6735, + "mean_token_accuracy": 0.7945159912109375, + "num_tokens": 181578229.0, + "step": 77010 + }, + { + "epoch": 0.7061520124690566, + "learning_rate": 5.877143119097828e-05, + "loss": 0.689, + "mean_token_accuracy": 0.791348934173584, + "num_tokens": 181603749.0, + "step": 77020 + }, + { + "epoch": 0.7062436967085358, + "learning_rate": 5.875309434308242e-05, + "loss": 0.6732, + "mean_token_accuracy": 0.7935809016227722, + "num_tokens": 181629104.0, + "step": 77030 + }, + { + "epoch": 0.7063353809480151, + "learning_rate": 5.8734757495186575e-05, + "loss": 0.6819, + "mean_token_accuracy": 0.7947469830513001, + "num_tokens": 181653839.0, + "step": 77040 + }, + { + "epoch": 0.7064270651874943, + "learning_rate": 5.871642064729074e-05, + "loss": 0.7116, + "mean_token_accuracy": 0.7810812950134277, + "num_tokens": 181679173.0, + "step": 77050 + }, + { + "epoch": 0.7065187494269735, + "learning_rate": 5.8698083799394886e-05, + "loss": 0.6704, + "mean_token_accuracy": 0.7936798632144928, + "num_tokens": 181704820.0, + "step": 77060 + }, + { + "epoch": 0.7066104336664527, + "learning_rate": 5.867974695149904e-05, + "loss": 0.6719, + "mean_token_accuracy": 0.7947412610054017, + "num_tokens": 181729585.0, + "step": 77070 + }, + { + "epoch": 0.706702117905932, + "learning_rate": 5.8661410103603196e-05, + "loss": 0.6822, + "mean_token_accuracy": 0.789141708612442, + "num_tokens": 181754007.0, + "step": 77080 + }, + { + "epoch": 0.7067938021454112, + "learning_rate": 5.864307325570735e-05, + "loss": 0.6848, + "mean_token_accuracy": 0.7885053396224976, + "num_tokens": 181779081.0, + "step": 77090 + }, + { + "epoch": 0.7068854863848905, + "learning_rate": 5.86247364078115e-05, + "loss": 0.6794, + "mean_token_accuracy": 0.7914442479610443, + "num_tokens": 181804143.0, + "step": 77100 + }, + { + "epoch": 0.7069771706243697, + "learning_rate": 5.8606399559915645e-05, + "loss": 0.6618, + "mean_token_accuracy": 0.7903600037097931, + "num_tokens": 181829360.0, + "step": 77110 + }, + { + "epoch": 0.7070688548638489, + "learning_rate": 5.858806271201981e-05, + "loss": 0.6787, + "mean_token_accuracy": 0.7898567736148834, + "num_tokens": 181854744.0, + "step": 77120 + }, + { + "epoch": 0.7071605391033281, + "learning_rate": 5.8569725864123956e-05, + "loss": 0.6817, + "mean_token_accuracy": 0.789820522069931, + "num_tokens": 181878917.0, + "step": 77130 + }, + { + "epoch": 0.7072522233428074, + "learning_rate": 5.855138901622811e-05, + "loss": 0.6598, + "mean_token_accuracy": 0.796710067987442, + "num_tokens": 181904273.0, + "step": 77140 + }, + { + "epoch": 0.7073439075822866, + "learning_rate": 5.853305216833227e-05, + "loss": 0.663, + "mean_token_accuracy": 0.7935916244983673, + "num_tokens": 181929692.0, + "step": 77150 + }, + { + "epoch": 0.7074355918217659, + "learning_rate": 5.851471532043642e-05, + "loss": 0.6619, + "mean_token_accuracy": 0.7959802508354187, + "num_tokens": 181954993.0, + "step": 77160 + }, + { + "epoch": 0.7075272760612451, + "learning_rate": 5.849637847254057e-05, + "loss": 0.6688, + "mean_token_accuracy": 0.7960519790649414, + "num_tokens": 181979921.0, + "step": 77170 + }, + { + "epoch": 0.7076189603007244, + "learning_rate": 5.847804162464473e-05, + "loss": 0.6837, + "mean_token_accuracy": 0.794447660446167, + "num_tokens": 182004918.0, + "step": 77180 + }, + { + "epoch": 0.7077106445402035, + "learning_rate": 5.845970477674888e-05, + "loss": 0.6876, + "mean_token_accuracy": 0.784761905670166, + "num_tokens": 182029610.0, + "step": 77190 + }, + { + "epoch": 0.7078023287796827, + "learning_rate": 5.844136792885303e-05, + "loss": 0.6725, + "mean_token_accuracy": 0.7931979894638062, + "num_tokens": 182054775.0, + "step": 77200 + }, + { + "epoch": 0.707894013019162, + "learning_rate": 5.842303108095719e-05, + "loss": 0.7529, + "mean_token_accuracy": 0.7726520478725434, + "num_tokens": 182079881.0, + "step": 77210 + }, + { + "epoch": 0.7079856972586412, + "learning_rate": 5.840469423306134e-05, + "loss": 0.6818, + "mean_token_accuracy": 0.7893115043640136, + "num_tokens": 182105885.0, + "step": 77220 + }, + { + "epoch": 0.7080773814981205, + "learning_rate": 5.838635738516549e-05, + "loss": 0.7009, + "mean_token_accuracy": 0.7863038897514343, + "num_tokens": 182130750.0, + "step": 77230 + }, + { + "epoch": 0.7081690657375997, + "learning_rate": 5.836802053726964e-05, + "loss": 0.7407, + "mean_token_accuracy": 0.7787288665771485, + "num_tokens": 182155639.0, + "step": 77240 + }, + { + "epoch": 0.7082607499770789, + "learning_rate": 5.8349683689373805e-05, + "loss": 0.664, + "mean_token_accuracy": 0.7939791321754456, + "num_tokens": 182179991.0, + "step": 77250 + }, + { + "epoch": 0.7083524342165581, + "learning_rate": 5.833134684147795e-05, + "loss": 0.6617, + "mean_token_accuracy": 0.7917009890079498, + "num_tokens": 182204313.0, + "step": 77260 + }, + { + "epoch": 0.7084441184560374, + "learning_rate": 5.83130099935821e-05, + "loss": 0.6856, + "mean_token_accuracy": 0.7876560926437378, + "num_tokens": 182228841.0, + "step": 77270 + }, + { + "epoch": 0.7085358026955166, + "learning_rate": 5.829467314568626e-05, + "loss": 0.7318, + "mean_token_accuracy": 0.7744341731071472, + "num_tokens": 182253508.0, + "step": 77280 + }, + { + "epoch": 0.7086274869349959, + "learning_rate": 5.827633629779041e-05, + "loss": 0.7052, + "mean_token_accuracy": 0.7833770155906677, + "num_tokens": 182278515.0, + "step": 77290 + }, + { + "epoch": 0.7087191711744751, + "learning_rate": 5.8257999449894564e-05, + "loss": 0.6478, + "mean_token_accuracy": 0.7999937832355499, + "num_tokens": 182304055.0, + "step": 77300 + }, + { + "epoch": 0.7088108554139544, + "learning_rate": 5.823966260199872e-05, + "loss": 0.6582, + "mean_token_accuracy": 0.7930777072906494, + "num_tokens": 182329142.0, + "step": 77310 + }, + { + "epoch": 0.7089025396534335, + "learning_rate": 5.8221325754102875e-05, + "loss": 0.6816, + "mean_token_accuracy": 0.7900965869426727, + "num_tokens": 182353892.0, + "step": 77320 + }, + { + "epoch": 0.7089942238929128, + "learning_rate": 5.820298890620702e-05, + "loss": 0.6786, + "mean_token_accuracy": 0.7906683802604675, + "num_tokens": 182378853.0, + "step": 77330 + }, + { + "epoch": 0.709085908132392, + "learning_rate": 5.8184652058311185e-05, + "loss": 0.6946, + "mean_token_accuracy": 0.7840655148029327, + "num_tokens": 182404074.0, + "step": 77340 + }, + { + "epoch": 0.7091775923718713, + "learning_rate": 5.816631521041534e-05, + "loss": 0.6715, + "mean_token_accuracy": 0.7909890592098237, + "num_tokens": 182429726.0, + "step": 77350 + }, + { + "epoch": 0.7092692766113505, + "learning_rate": 5.814797836251948e-05, + "loss": 0.6804, + "mean_token_accuracy": 0.7889102041721344, + "num_tokens": 182455672.0, + "step": 77360 + }, + { + "epoch": 0.7093609608508298, + "learning_rate": 5.8129641514623634e-05, + "loss": 0.6953, + "mean_token_accuracy": 0.7895851194858551, + "num_tokens": 182480786.0, + "step": 77370 + }, + { + "epoch": 0.709452645090309, + "learning_rate": 5.811130466672779e-05, + "loss": 0.6768, + "mean_token_accuracy": 0.7942793130874634, + "num_tokens": 182506078.0, + "step": 77380 + }, + { + "epoch": 0.7095443293297882, + "learning_rate": 5.8092967818831945e-05, + "loss": 0.6555, + "mean_token_accuracy": 0.7945311725139618, + "num_tokens": 182531261.0, + "step": 77390 + }, + { + "epoch": 0.7096360135692674, + "learning_rate": 5.80746309709361e-05, + "loss": 0.651, + "mean_token_accuracy": 0.7952611863613128, + "num_tokens": 182556398.0, + "step": 77400 + }, + { + "epoch": 0.7097276978087467, + "learning_rate": 5.8056294123040255e-05, + "loss": 0.6794, + "mean_token_accuracy": 0.7877298772335053, + "num_tokens": 182581226.0, + "step": 77410 + }, + { + "epoch": 0.7098193820482259, + "learning_rate": 5.803795727514441e-05, + "loss": 0.6868, + "mean_token_accuracy": 0.7852868854999542, + "num_tokens": 182606563.0, + "step": 77420 + }, + { + "epoch": 0.7099110662877052, + "learning_rate": 5.801962042724855e-05, + "loss": 0.6883, + "mean_token_accuracy": 0.7888477265834808, + "num_tokens": 182631515.0, + "step": 77430 + }, + { + "epoch": 0.7100027505271844, + "learning_rate": 5.800128357935272e-05, + "loss": 0.7187, + "mean_token_accuracy": 0.787151426076889, + "num_tokens": 182656070.0, + "step": 77440 + }, + { + "epoch": 0.7100944347666636, + "learning_rate": 5.798294673145687e-05, + "loss": 0.6444, + "mean_token_accuracy": 0.7948240578174591, + "num_tokens": 182681575.0, + "step": 77450 + }, + { + "epoch": 0.7101861190061428, + "learning_rate": 5.7964609883561015e-05, + "loss": 0.6702, + "mean_token_accuracy": 0.7921246230602265, + "num_tokens": 182707205.0, + "step": 77460 + }, + { + "epoch": 0.7102778032456221, + "learning_rate": 5.794627303566518e-05, + "loss": 0.6597, + "mean_token_accuracy": 0.7928208768367767, + "num_tokens": 182732143.0, + "step": 77470 + }, + { + "epoch": 0.7103694874851013, + "learning_rate": 5.7927936187769325e-05, + "loss": 0.6765, + "mean_token_accuracy": 0.7914460361003876, + "num_tokens": 182757778.0, + "step": 77480 + }, + { + "epoch": 0.7104611717245806, + "learning_rate": 5.790959933987348e-05, + "loss": 0.6648, + "mean_token_accuracy": 0.7961377739906311, + "num_tokens": 182782644.0, + "step": 77490 + }, + { + "epoch": 0.7105528559640598, + "learning_rate": 5.789126249197763e-05, + "loss": 0.6614, + "mean_token_accuracy": 0.7947397768497467, + "num_tokens": 182807805.0, + "step": 77500 + }, + { + "epoch": 0.7106445402035391, + "learning_rate": 5.787292564408179e-05, + "loss": 0.6889, + "mean_token_accuracy": 0.7911662220954895, + "num_tokens": 182833562.0, + "step": 77510 + }, + { + "epoch": 0.7107362244430182, + "learning_rate": 5.785458879618594e-05, + "loss": 0.6902, + "mean_token_accuracy": 0.7831215023994446, + "num_tokens": 182859458.0, + "step": 77520 + }, + { + "epoch": 0.7108279086824975, + "learning_rate": 5.7836251948290085e-05, + "loss": 0.6976, + "mean_token_accuracy": 0.7894893825054169, + "num_tokens": 182884385.0, + "step": 77530 + }, + { + "epoch": 0.7109195929219767, + "learning_rate": 5.781791510039425e-05, + "loss": 0.6462, + "mean_token_accuracy": 0.7979496419429779, + "num_tokens": 182909871.0, + "step": 77540 + }, + { + "epoch": 0.711011277161456, + "learning_rate": 5.77995782524984e-05, + "loss": 0.7004, + "mean_token_accuracy": 0.7869316816329956, + "num_tokens": 182935038.0, + "step": 77550 + }, + { + "epoch": 0.7111029614009352, + "learning_rate": 5.778124140460255e-05, + "loss": 0.6854, + "mean_token_accuracy": 0.7915327310562134, + "num_tokens": 182960594.0, + "step": 77560 + }, + { + "epoch": 0.7111946456404145, + "learning_rate": 5.776290455670671e-05, + "loss": 0.6172, + "mean_token_accuracy": 0.8074375748634338, + "num_tokens": 182985612.0, + "step": 77570 + }, + { + "epoch": 0.7112863298798936, + "learning_rate": 5.774456770881086e-05, + "loss": 0.6528, + "mean_token_accuracy": 0.7955219149589539, + "num_tokens": 183010303.0, + "step": 77580 + }, + { + "epoch": 0.7113780141193728, + "learning_rate": 5.772623086091501e-05, + "loss": 0.6945, + "mean_token_accuracy": 0.789950567483902, + "num_tokens": 183035037.0, + "step": 77590 + }, + { + "epoch": 0.7114696983588521, + "learning_rate": 5.770789401301917e-05, + "loss": 0.6861, + "mean_token_accuracy": 0.7843886494636536, + "num_tokens": 183059573.0, + "step": 77600 + }, + { + "epoch": 0.7115613825983313, + "learning_rate": 5.768955716512332e-05, + "loss": 0.6424, + "mean_token_accuracy": 0.8002339243888855, + "num_tokens": 183084243.0, + "step": 77610 + }, + { + "epoch": 0.7116530668378106, + "learning_rate": 5.767122031722747e-05, + "loss": 0.712, + "mean_token_accuracy": 0.7875123262405396, + "num_tokens": 183110146.0, + "step": 77620 + }, + { + "epoch": 0.7117447510772899, + "learning_rate": 5.765288346933162e-05, + "loss": 0.6586, + "mean_token_accuracy": 0.7953888654708863, + "num_tokens": 183135299.0, + "step": 77630 + }, + { + "epoch": 0.7118364353167691, + "learning_rate": 5.763454662143578e-05, + "loss": 0.6636, + "mean_token_accuracy": 0.7930649042129516, + "num_tokens": 183160040.0, + "step": 77640 + }, + { + "epoch": 0.7119281195562482, + "learning_rate": 5.7616209773539934e-05, + "loss": 0.6884, + "mean_token_accuracy": 0.7891636252403259, + "num_tokens": 183184777.0, + "step": 77650 + }, + { + "epoch": 0.7120198037957275, + "learning_rate": 5.759787292564408e-05, + "loss": 0.6578, + "mean_token_accuracy": 0.7926559567451477, + "num_tokens": 183210093.0, + "step": 77660 + }, + { + "epoch": 0.7121114880352067, + "learning_rate": 5.7579536077748245e-05, + "loss": 0.661, + "mean_token_accuracy": 0.7948283314704895, + "num_tokens": 183235845.0, + "step": 77670 + }, + { + "epoch": 0.712203172274686, + "learning_rate": 5.756119922985239e-05, + "loss": 0.6649, + "mean_token_accuracy": 0.7924795091152191, + "num_tokens": 183261107.0, + "step": 77680 + }, + { + "epoch": 0.7122948565141652, + "learning_rate": 5.754286238195654e-05, + "loss": 0.6692, + "mean_token_accuracy": 0.7879079580307007, + "num_tokens": 183286263.0, + "step": 77690 + }, + { + "epoch": 0.7123865407536445, + "learning_rate": 5.75245255340607e-05, + "loss": 0.6687, + "mean_token_accuracy": 0.7926979243755341, + "num_tokens": 183311998.0, + "step": 77700 + }, + { + "epoch": 0.7124782249931236, + "learning_rate": 5.750618868616485e-05, + "loss": 0.7008, + "mean_token_accuracy": 0.7857622802257538, + "num_tokens": 183336922.0, + "step": 77710 + }, + { + "epoch": 0.7125699092326029, + "learning_rate": 5.7487851838269004e-05, + "loss": 0.7156, + "mean_token_accuracy": 0.7862915635108948, + "num_tokens": 183362223.0, + "step": 77720 + }, + { + "epoch": 0.7126615934720821, + "learning_rate": 5.746951499037315e-05, + "loss": 0.71, + "mean_token_accuracy": 0.7855953216552735, + "num_tokens": 183386996.0, + "step": 77730 + }, + { + "epoch": 0.7127532777115614, + "learning_rate": 5.7451178142477314e-05, + "loss": 0.6739, + "mean_token_accuracy": 0.7907623469829559, + "num_tokens": 183411714.0, + "step": 77740 + }, + { + "epoch": 0.7128449619510406, + "learning_rate": 5.7432841294581466e-05, + "loss": 0.6828, + "mean_token_accuracy": 0.786265766620636, + "num_tokens": 183436531.0, + "step": 77750 + }, + { + "epoch": 0.7129366461905199, + "learning_rate": 5.741450444668561e-05, + "loss": 0.6642, + "mean_token_accuracy": 0.7964664816856384, + "num_tokens": 183461573.0, + "step": 77760 + }, + { + "epoch": 0.7130283304299991, + "learning_rate": 5.739616759878978e-05, + "loss": 0.6899, + "mean_token_accuracy": 0.7901533544063568, + "num_tokens": 183487012.0, + "step": 77770 + }, + { + "epoch": 0.7131200146694783, + "learning_rate": 5.737783075089392e-05, + "loss": 0.6765, + "mean_token_accuracy": 0.7908352613449097, + "num_tokens": 183512918.0, + "step": 77780 + }, + { + "epoch": 0.7132116989089575, + "learning_rate": 5.7359493902998074e-05, + "loss": 0.6814, + "mean_token_accuracy": 0.7902816355228424, + "num_tokens": 183538668.0, + "step": 77790 + }, + { + "epoch": 0.7133033831484368, + "learning_rate": 5.734115705510223e-05, + "loss": 0.6658, + "mean_token_accuracy": 0.7939606606960297, + "num_tokens": 183563237.0, + "step": 77800 + }, + { + "epoch": 0.713395067387916, + "learning_rate": 5.7322820207206384e-05, + "loss": 0.6865, + "mean_token_accuracy": 0.7885273933410645, + "num_tokens": 183588836.0, + "step": 77810 + }, + { + "epoch": 0.7134867516273953, + "learning_rate": 5.7304483359310536e-05, + "loss": 0.7152, + "mean_token_accuracy": 0.7769215404987335, + "num_tokens": 183613841.0, + "step": 77820 + }, + { + "epoch": 0.7135784358668745, + "learning_rate": 5.7286146511414695e-05, + "loss": 0.6771, + "mean_token_accuracy": 0.7876941502094269, + "num_tokens": 183638946.0, + "step": 77830 + }, + { + "epoch": 0.7136701201063537, + "learning_rate": 5.726780966351885e-05, + "loss": 0.6726, + "mean_token_accuracy": 0.7927168607711792, + "num_tokens": 183664240.0, + "step": 77840 + }, + { + "epoch": 0.7137618043458329, + "learning_rate": 5.7249472815623e-05, + "loss": 0.6796, + "mean_token_accuracy": 0.7934220433235168, + "num_tokens": 183689042.0, + "step": 77850 + }, + { + "epoch": 0.7138534885853122, + "learning_rate": 5.7231135967727144e-05, + "loss": 0.6972, + "mean_token_accuracy": 0.7839462220668793, + "num_tokens": 183713691.0, + "step": 77860 + }, + { + "epoch": 0.7139451728247914, + "learning_rate": 5.721279911983131e-05, + "loss": 0.6963, + "mean_token_accuracy": 0.7842570841312408, + "num_tokens": 183739332.0, + "step": 77870 + }, + { + "epoch": 0.7140368570642707, + "learning_rate": 5.7194462271935454e-05, + "loss": 0.6864, + "mean_token_accuracy": 0.7891451597213746, + "num_tokens": 183763411.0, + "step": 77880 + }, + { + "epoch": 0.7141285413037499, + "learning_rate": 5.7176125424039606e-05, + "loss": 0.6821, + "mean_token_accuracy": 0.7885421097278595, + "num_tokens": 183789127.0, + "step": 77890 + }, + { + "epoch": 0.7142202255432292, + "learning_rate": 5.7157788576143765e-05, + "loss": 0.6711, + "mean_token_accuracy": 0.7992440283298492, + "num_tokens": 183813609.0, + "step": 77900 + }, + { + "epoch": 0.7143119097827083, + "learning_rate": 5.7139451728247916e-05, + "loss": 0.6896, + "mean_token_accuracy": 0.792653614282608, + "num_tokens": 183839326.0, + "step": 77910 + }, + { + "epoch": 0.7144035940221876, + "learning_rate": 5.712111488035207e-05, + "loss": 0.6584, + "mean_token_accuracy": 0.7985167622566223, + "num_tokens": 183864306.0, + "step": 77920 + }, + { + "epoch": 0.7144952782616668, + "learning_rate": 5.710277803245623e-05, + "loss": 0.6647, + "mean_token_accuracy": 0.7934771120548249, + "num_tokens": 183888814.0, + "step": 77930 + }, + { + "epoch": 0.7145869625011461, + "learning_rate": 5.708444118456038e-05, + "loss": 0.6897, + "mean_token_accuracy": 0.7820202767848968, + "num_tokens": 183913876.0, + "step": 77940 + }, + { + "epoch": 0.7146786467406253, + "learning_rate": 5.706610433666453e-05, + "loss": 0.6741, + "mean_token_accuracy": 0.7928056299686432, + "num_tokens": 183940439.0, + "step": 77950 + }, + { + "epoch": 0.7147703309801046, + "learning_rate": 5.704776748876869e-05, + "loss": 0.6822, + "mean_token_accuracy": 0.7908152997493744, + "num_tokens": 183965069.0, + "step": 77960 + }, + { + "epoch": 0.7148620152195837, + "learning_rate": 5.702943064087284e-05, + "loss": 0.6795, + "mean_token_accuracy": 0.788107693195343, + "num_tokens": 183990839.0, + "step": 77970 + }, + { + "epoch": 0.714953699459063, + "learning_rate": 5.7011093792976986e-05, + "loss": 0.6618, + "mean_token_accuracy": 0.7950737059116364, + "num_tokens": 184016216.0, + "step": 77980 + }, + { + "epoch": 0.7150453836985422, + "learning_rate": 5.699275694508114e-05, + "loss": 0.6588, + "mean_token_accuracy": 0.7969727396965027, + "num_tokens": 184041948.0, + "step": 77990 + }, + { + "epoch": 0.7151370679380215, + "learning_rate": 5.69744200971853e-05, + "loss": 0.6799, + "mean_token_accuracy": 0.7882644653320312, + "num_tokens": 184067725.0, + "step": 78000 + }, + { + "epoch": 0.7152287521775007, + "learning_rate": 5.695608324928945e-05, + "loss": 0.6748, + "mean_token_accuracy": 0.7901932060718536, + "num_tokens": 184093110.0, + "step": 78010 + }, + { + "epoch": 0.71532043641698, + "learning_rate": 5.69377464013936e-05, + "loss": 0.6965, + "mean_token_accuracy": 0.7816961944103241, + "num_tokens": 184118664.0, + "step": 78020 + }, + { + "epoch": 0.7154121206564592, + "learning_rate": 5.691940955349776e-05, + "loss": 0.6699, + "mean_token_accuracy": 0.7908800780773163, + "num_tokens": 184144459.0, + "step": 78030 + }, + { + "epoch": 0.7155038048959383, + "learning_rate": 5.690107270560191e-05, + "loss": 0.6561, + "mean_token_accuracy": 0.7967715203762055, + "num_tokens": 184170559.0, + "step": 78040 + }, + { + "epoch": 0.7155954891354176, + "learning_rate": 5.688273585770606e-05, + "loss": 0.6547, + "mean_token_accuracy": 0.7976432323455811, + "num_tokens": 184195970.0, + "step": 78050 + }, + { + "epoch": 0.7156871733748968, + "learning_rate": 5.686439900981022e-05, + "loss": 0.6971, + "mean_token_accuracy": 0.7896312355995179, + "num_tokens": 184221762.0, + "step": 78060 + }, + { + "epoch": 0.7157788576143761, + "learning_rate": 5.6846062161914373e-05, + "loss": 0.6806, + "mean_token_accuracy": 0.7902872085571289, + "num_tokens": 184246845.0, + "step": 78070 + }, + { + "epoch": 0.7158705418538553, + "learning_rate": 5.682772531401852e-05, + "loss": 0.6844, + "mean_token_accuracy": 0.7874055624008178, + "num_tokens": 184271935.0, + "step": 78080 + }, + { + "epoch": 0.7159622260933346, + "learning_rate": 5.6809388466122684e-05, + "loss": 0.6831, + "mean_token_accuracy": 0.7964799761772156, + "num_tokens": 184296852.0, + "step": 78090 + }, + { + "epoch": 0.7160539103328137, + "learning_rate": 5.679105161822683e-05, + "loss": 0.6495, + "mean_token_accuracy": 0.7958796322345734, + "num_tokens": 184322161.0, + "step": 78100 + }, + { + "epoch": 0.716145594572293, + "learning_rate": 5.677271477033098e-05, + "loss": 0.6727, + "mean_token_accuracy": 0.7924707174301148, + "num_tokens": 184346686.0, + "step": 78110 + }, + { + "epoch": 0.7162372788117722, + "learning_rate": 5.675437792243513e-05, + "loss": 0.7045, + "mean_token_accuracy": 0.7871766507625579, + "num_tokens": 184371236.0, + "step": 78120 + }, + { + "epoch": 0.7163289630512515, + "learning_rate": 5.673604107453929e-05, + "loss": 0.678, + "mean_token_accuracy": 0.7908380270004273, + "num_tokens": 184396549.0, + "step": 78130 + }, + { + "epoch": 0.7164206472907307, + "learning_rate": 5.671770422664344e-05, + "loss": 0.739, + "mean_token_accuracy": 0.7799354910850524, + "num_tokens": 184422153.0, + "step": 78140 + }, + { + "epoch": 0.71651233153021, + "learning_rate": 5.6699367378747595e-05, + "loss": 0.6654, + "mean_token_accuracy": 0.7889452934265136, + "num_tokens": 184447079.0, + "step": 78150 + }, + { + "epoch": 0.7166040157696892, + "learning_rate": 5.6681030530851754e-05, + "loss": 0.6541, + "mean_token_accuracy": 0.8021519839763641, + "num_tokens": 184471782.0, + "step": 78160 + }, + { + "epoch": 0.7166957000091684, + "learning_rate": 5.6662693682955906e-05, + "loss": 0.6971, + "mean_token_accuracy": 0.790956997871399, + "num_tokens": 184496885.0, + "step": 78170 + }, + { + "epoch": 0.7167873842486476, + "learning_rate": 5.664435683506005e-05, + "loss": 0.7147, + "mean_token_accuracy": 0.7888283967971802, + "num_tokens": 184521899.0, + "step": 78180 + }, + { + "epoch": 0.7168790684881269, + "learning_rate": 5.6626019987164216e-05, + "loss": 0.6686, + "mean_token_accuracy": 0.7869354009628295, + "num_tokens": 184546847.0, + "step": 78190 + }, + { + "epoch": 0.7169707527276061, + "learning_rate": 5.660768313926836e-05, + "loss": 0.6797, + "mean_token_accuracy": 0.7971076250076294, + "num_tokens": 184571856.0, + "step": 78200 + }, + { + "epoch": 0.7170624369670854, + "learning_rate": 5.658934629137251e-05, + "loss": 0.654, + "mean_token_accuracy": 0.7961293399333954, + "num_tokens": 184596631.0, + "step": 78210 + }, + { + "epoch": 0.7171541212065646, + "learning_rate": 5.6571009443476665e-05, + "loss": 0.6728, + "mean_token_accuracy": 0.7975492119789124, + "num_tokens": 184621829.0, + "step": 78220 + }, + { + "epoch": 0.7172458054460438, + "learning_rate": 5.6552672595580824e-05, + "loss": 0.6894, + "mean_token_accuracy": 0.7944309294223786, + "num_tokens": 184646998.0, + "step": 78230 + }, + { + "epoch": 0.717337489685523, + "learning_rate": 5.6534335747684976e-05, + "loss": 0.6811, + "mean_token_accuracy": 0.794684249162674, + "num_tokens": 184671729.0, + "step": 78240 + }, + { + "epoch": 0.7174291739250023, + "learning_rate": 5.651599889978913e-05, + "loss": 0.6638, + "mean_token_accuracy": 0.7963333606719971, + "num_tokens": 184696035.0, + "step": 78250 + }, + { + "epoch": 0.7175208581644815, + "learning_rate": 5.6497662051893286e-05, + "loss": 0.6787, + "mean_token_accuracy": 0.7910999178886413, + "num_tokens": 184721316.0, + "step": 78260 + }, + { + "epoch": 0.7176125424039608, + "learning_rate": 5.647932520399744e-05, + "loss": 0.6586, + "mean_token_accuracy": 0.797629326581955, + "num_tokens": 184745371.0, + "step": 78270 + }, + { + "epoch": 0.71770422664344, + "learning_rate": 5.646098835610158e-05, + "loss": 0.6686, + "mean_token_accuracy": 0.7965006291866302, + "num_tokens": 184770817.0, + "step": 78280 + }, + { + "epoch": 0.7177959108829193, + "learning_rate": 5.644265150820575e-05, + "loss": 0.6872, + "mean_token_accuracy": 0.784556770324707, + "num_tokens": 184796011.0, + "step": 78290 + }, + { + "epoch": 0.7178875951223984, + "learning_rate": 5.6424314660309894e-05, + "loss": 0.6748, + "mean_token_accuracy": 0.7958771646022796, + "num_tokens": 184821089.0, + "step": 78300 + }, + { + "epoch": 0.7179792793618777, + "learning_rate": 5.6405977812414045e-05, + "loss": 0.7017, + "mean_token_accuracy": 0.7866156160831451, + "num_tokens": 184845931.0, + "step": 78310 + }, + { + "epoch": 0.7180709636013569, + "learning_rate": 5.6387640964518204e-05, + "loss": 0.6559, + "mean_token_accuracy": 0.7917865931987762, + "num_tokens": 184871315.0, + "step": 78320 + }, + { + "epoch": 0.7181626478408362, + "learning_rate": 5.6369304116622356e-05, + "loss": 0.6518, + "mean_token_accuracy": 0.7963665962219239, + "num_tokens": 184896598.0, + "step": 78330 + }, + { + "epoch": 0.7182543320803154, + "learning_rate": 5.635096726872651e-05, + "loss": 0.6603, + "mean_token_accuracy": 0.7953488826751709, + "num_tokens": 184922270.0, + "step": 78340 + }, + { + "epoch": 0.7183460163197947, + "learning_rate": 5.633263042083066e-05, + "loss": 0.684, + "mean_token_accuracy": 0.7936093211174011, + "num_tokens": 184947628.0, + "step": 78350 + }, + { + "epoch": 0.7184377005592738, + "learning_rate": 5.631429357293482e-05, + "loss": 0.691, + "mean_token_accuracy": 0.7842152416706085, + "num_tokens": 184972995.0, + "step": 78360 + }, + { + "epoch": 0.7185293847987531, + "learning_rate": 5.629595672503897e-05, + "loss": 0.6555, + "mean_token_accuracy": 0.7920524537563324, + "num_tokens": 184998223.0, + "step": 78370 + }, + { + "epoch": 0.7186210690382323, + "learning_rate": 5.6277619877143115e-05, + "loss": 0.6673, + "mean_token_accuracy": 0.7891258299350739, + "num_tokens": 185023009.0, + "step": 78380 + }, + { + "epoch": 0.7187127532777116, + "learning_rate": 5.625928302924728e-05, + "loss": 0.7255, + "mean_token_accuracy": 0.7829273462295532, + "num_tokens": 185048043.0, + "step": 78390 + }, + { + "epoch": 0.7188044375171908, + "learning_rate": 5.6240946181351426e-05, + "loss": 0.7108, + "mean_token_accuracy": 0.7833603918552399, + "num_tokens": 185072602.0, + "step": 78400 + }, + { + "epoch": 0.7188961217566701, + "learning_rate": 5.622260933345558e-05, + "loss": 0.6909, + "mean_token_accuracy": 0.7880420744419098, + "num_tokens": 185097881.0, + "step": 78410 + }, + { + "epoch": 0.7189878059961493, + "learning_rate": 5.6204272485559736e-05, + "loss": 0.6747, + "mean_token_accuracy": 0.7878067791461945, + "num_tokens": 185122978.0, + "step": 78420 + }, + { + "epoch": 0.7190794902356284, + "learning_rate": 5.618593563766389e-05, + "loss": 0.6386, + "mean_token_accuracy": 0.8035356938838959, + "num_tokens": 185148717.0, + "step": 78430 + }, + { + "epoch": 0.7191711744751077, + "learning_rate": 5.616759878976804e-05, + "loss": 0.6618, + "mean_token_accuracy": 0.7942996501922608, + "num_tokens": 185174113.0, + "step": 78440 + }, + { + "epoch": 0.719262858714587, + "learning_rate": 5.61492619418722e-05, + "loss": 0.6626, + "mean_token_accuracy": 0.7976067721843719, + "num_tokens": 185199948.0, + "step": 78450 + }, + { + "epoch": 0.7193545429540662, + "learning_rate": 5.613092509397635e-05, + "loss": 0.6354, + "mean_token_accuracy": 0.8027196645736694, + "num_tokens": 185225238.0, + "step": 78460 + }, + { + "epoch": 0.7194462271935455, + "learning_rate": 5.61125882460805e-05, + "loss": 0.6328, + "mean_token_accuracy": 0.7983404517173767, + "num_tokens": 185249699.0, + "step": 78470 + }, + { + "epoch": 0.7195379114330247, + "learning_rate": 5.609425139818465e-05, + "loss": 0.6722, + "mean_token_accuracy": 0.7945112943649292, + "num_tokens": 185274338.0, + "step": 78480 + }, + { + "epoch": 0.7196295956725038, + "learning_rate": 5.607591455028881e-05, + "loss": 0.6664, + "mean_token_accuracy": 0.7904851019382477, + "num_tokens": 185300034.0, + "step": 78490 + }, + { + "epoch": 0.7197212799119831, + "learning_rate": 5.605757770239296e-05, + "loss": 0.6707, + "mean_token_accuracy": 0.7888002574443818, + "num_tokens": 185324876.0, + "step": 78500 + }, + { + "epoch": 0.7198129641514623, + "learning_rate": 5.603924085449711e-05, + "loss": 0.6407, + "mean_token_accuracy": 0.8010428786277771, + "num_tokens": 185349660.0, + "step": 78510 + }, + { + "epoch": 0.7199046483909416, + "learning_rate": 5.602090400660127e-05, + "loss": 0.7143, + "mean_token_accuracy": 0.786019253730774, + "num_tokens": 185374978.0, + "step": 78520 + }, + { + "epoch": 0.7199963326304208, + "learning_rate": 5.600256715870542e-05, + "loss": 0.6712, + "mean_token_accuracy": 0.7957077205181122, + "num_tokens": 185398963.0, + "step": 78530 + }, + { + "epoch": 0.7200880168699001, + "learning_rate": 5.598423031080957e-05, + "loss": 0.6747, + "mean_token_accuracy": 0.7959294199943543, + "num_tokens": 185424009.0, + "step": 78540 + }, + { + "epoch": 0.7201797011093793, + "learning_rate": 5.596589346291373e-05, + "loss": 0.6583, + "mean_token_accuracy": 0.7982489109039307, + "num_tokens": 185448764.0, + "step": 78550 + }, + { + "epoch": 0.7202713853488585, + "learning_rate": 5.594755661501788e-05, + "loss": 0.6693, + "mean_token_accuracy": 0.7920622050762176, + "num_tokens": 185473983.0, + "step": 78560 + }, + { + "epoch": 0.7203630695883377, + "learning_rate": 5.5929219767122035e-05, + "loss": 0.6775, + "mean_token_accuracy": 0.7899169385433197, + "num_tokens": 185499079.0, + "step": 78570 + }, + { + "epoch": 0.720454753827817, + "learning_rate": 5.591088291922619e-05, + "loss": 0.6844, + "mean_token_accuracy": 0.7954796433448792, + "num_tokens": 185524004.0, + "step": 78580 + }, + { + "epoch": 0.7205464380672962, + "learning_rate": 5.5892546071330345e-05, + "loss": 0.6807, + "mean_token_accuracy": 0.7902134656906128, + "num_tokens": 185549231.0, + "step": 78590 + }, + { + "epoch": 0.7206381223067755, + "learning_rate": 5.587420922343449e-05, + "loss": 0.6637, + "mean_token_accuracy": 0.7953526675701141, + "num_tokens": 185574857.0, + "step": 78600 + }, + { + "epoch": 0.7207298065462547, + "learning_rate": 5.585587237553864e-05, + "loss": 0.6884, + "mean_token_accuracy": 0.7841347217559814, + "num_tokens": 185600589.0, + "step": 78610 + }, + { + "epoch": 0.720821490785734, + "learning_rate": 5.58375355276428e-05, + "loss": 0.6725, + "mean_token_accuracy": 0.7924810409545898, + "num_tokens": 185626131.0, + "step": 78620 + }, + { + "epoch": 0.7209131750252131, + "learning_rate": 5.581919867974695e-05, + "loss": 0.739, + "mean_token_accuracy": 0.7724352061748505, + "num_tokens": 185650834.0, + "step": 78630 + }, + { + "epoch": 0.7210048592646924, + "learning_rate": 5.5800861831851104e-05, + "loss": 0.7, + "mean_token_accuracy": 0.7873457729816437, + "num_tokens": 185675546.0, + "step": 78640 + }, + { + "epoch": 0.7210965435041716, + "learning_rate": 5.578252498395526e-05, + "loss": 0.7074, + "mean_token_accuracy": 0.7801327109336853, + "num_tokens": 185700499.0, + "step": 78650 + }, + { + "epoch": 0.7211882277436509, + "learning_rate": 5.5764188136059415e-05, + "loss": 0.6962, + "mean_token_accuracy": 0.7899401545524597, + "num_tokens": 185725749.0, + "step": 78660 + }, + { + "epoch": 0.7212799119831301, + "learning_rate": 5.574585128816357e-05, + "loss": 0.6895, + "mean_token_accuracy": 0.7878952562808991, + "num_tokens": 185751311.0, + "step": 78670 + }, + { + "epoch": 0.7213715962226094, + "learning_rate": 5.5727514440267725e-05, + "loss": 0.6718, + "mean_token_accuracy": 0.7948323488235474, + "num_tokens": 185776398.0, + "step": 78680 + }, + { + "epoch": 0.7214632804620885, + "learning_rate": 5.570917759237188e-05, + "loss": 0.6829, + "mean_token_accuracy": 0.788807487487793, + "num_tokens": 185801653.0, + "step": 78690 + }, + { + "epoch": 0.7215549647015678, + "learning_rate": 5.569084074447602e-05, + "loss": 0.6704, + "mean_token_accuracy": 0.7911393821239472, + "num_tokens": 185826353.0, + "step": 78700 + }, + { + "epoch": 0.721646648941047, + "learning_rate": 5.567250389658019e-05, + "loss": 0.6506, + "mean_token_accuracy": 0.7973729252815247, + "num_tokens": 185851793.0, + "step": 78710 + }, + { + "epoch": 0.7217383331805263, + "learning_rate": 5.565416704868433e-05, + "loss": 0.6958, + "mean_token_accuracy": 0.7847602307796478, + "num_tokens": 185876706.0, + "step": 78720 + }, + { + "epoch": 0.7218300174200055, + "learning_rate": 5.5635830200788485e-05, + "loss": 0.679, + "mean_token_accuracy": 0.7909967482089997, + "num_tokens": 185901364.0, + "step": 78730 + }, + { + "epoch": 0.7219217016594848, + "learning_rate": 5.561749335289264e-05, + "loss": 0.6357, + "mean_token_accuracy": 0.8032341659069061, + "num_tokens": 185926419.0, + "step": 78740 + }, + { + "epoch": 0.722013385898964, + "learning_rate": 5.5599156504996795e-05, + "loss": 0.6583, + "mean_token_accuracy": 0.7890056610107422, + "num_tokens": 185952069.0, + "step": 78750 + }, + { + "epoch": 0.7221050701384432, + "learning_rate": 5.558081965710095e-05, + "loss": 0.6903, + "mean_token_accuracy": 0.7933500289916993, + "num_tokens": 185976944.0, + "step": 78760 + }, + { + "epoch": 0.7221967543779224, + "learning_rate": 5.55624828092051e-05, + "loss": 0.6541, + "mean_token_accuracy": 0.7989000022411347, + "num_tokens": 186002291.0, + "step": 78770 + }, + { + "epoch": 0.7222884386174017, + "learning_rate": 5.554414596130926e-05, + "loss": 0.6555, + "mean_token_accuracy": 0.793702495098114, + "num_tokens": 186026919.0, + "step": 78780 + }, + { + "epoch": 0.7223801228568809, + "learning_rate": 5.552580911341341e-05, + "loss": 0.6872, + "mean_token_accuracy": 0.789022421836853, + "num_tokens": 186051340.0, + "step": 78790 + }, + { + "epoch": 0.7224718070963602, + "learning_rate": 5.5507472265517555e-05, + "loss": 0.6527, + "mean_token_accuracy": 0.7955657958984375, + "num_tokens": 186076872.0, + "step": 78800 + }, + { + "epoch": 0.7225634913358394, + "learning_rate": 5.548913541762172e-05, + "loss": 0.6916, + "mean_token_accuracy": 0.7900915682315827, + "num_tokens": 186101860.0, + "step": 78810 + }, + { + "epoch": 0.7226551755753186, + "learning_rate": 5.5470798569725865e-05, + "loss": 0.6668, + "mean_token_accuracy": 0.7958865940570832, + "num_tokens": 186127330.0, + "step": 78820 + }, + { + "epoch": 0.7227468598147978, + "learning_rate": 5.545246172183002e-05, + "loss": 0.6644, + "mean_token_accuracy": 0.7916256606578826, + "num_tokens": 186152052.0, + "step": 78830 + }, + { + "epoch": 0.722838544054277, + "learning_rate": 5.543412487393417e-05, + "loss": 0.7049, + "mean_token_accuracy": 0.7891476035118103, + "num_tokens": 186177014.0, + "step": 78840 + }, + { + "epoch": 0.7229302282937563, + "learning_rate": 5.541578802603833e-05, + "loss": 0.6732, + "mean_token_accuracy": 0.7945551216602326, + "num_tokens": 186201813.0, + "step": 78850 + }, + { + "epoch": 0.7230219125332356, + "learning_rate": 5.539745117814248e-05, + "loss": 0.7291, + "mean_token_accuracy": 0.7831566095352173, + "num_tokens": 186226559.0, + "step": 78860 + }, + { + "epoch": 0.7231135967727148, + "learning_rate": 5.537911433024663e-05, + "loss": 0.6861, + "mean_token_accuracy": 0.7860622882843018, + "num_tokens": 186252464.0, + "step": 78870 + }, + { + "epoch": 0.7232052810121941, + "learning_rate": 5.536077748235079e-05, + "loss": 0.6671, + "mean_token_accuracy": 0.791435694694519, + "num_tokens": 186277649.0, + "step": 78880 + }, + { + "epoch": 0.7232969652516732, + "learning_rate": 5.534244063445494e-05, + "loss": 0.6624, + "mean_token_accuracy": 0.7957864880561829, + "num_tokens": 186303861.0, + "step": 78890 + }, + { + "epoch": 0.7233886494911524, + "learning_rate": 5.532410378655909e-05, + "loss": 0.6504, + "mean_token_accuracy": 0.7934846758842469, + "num_tokens": 186329435.0, + "step": 78900 + }, + { + "epoch": 0.7234803337306317, + "learning_rate": 5.530576693866325e-05, + "loss": 0.6774, + "mean_token_accuracy": 0.7886178255081177, + "num_tokens": 186355071.0, + "step": 78910 + }, + { + "epoch": 0.723572017970111, + "learning_rate": 5.52874300907674e-05, + "loss": 0.7046, + "mean_token_accuracy": 0.7809918045997619, + "num_tokens": 186380489.0, + "step": 78920 + }, + { + "epoch": 0.7236637022095902, + "learning_rate": 5.526909324287155e-05, + "loss": 0.6755, + "mean_token_accuracy": 0.7858296811580658, + "num_tokens": 186405377.0, + "step": 78930 + }, + { + "epoch": 0.7237553864490694, + "learning_rate": 5.525075639497571e-05, + "loss": 0.6941, + "mean_token_accuracy": 0.7824526309967041, + "num_tokens": 186430471.0, + "step": 78940 + }, + { + "epoch": 0.7238470706885486, + "learning_rate": 5.523241954707986e-05, + "loss": 0.667, + "mean_token_accuracy": 0.7918890476226806, + "num_tokens": 186456585.0, + "step": 78950 + }, + { + "epoch": 0.7239387549280278, + "learning_rate": 5.521408269918401e-05, + "loss": 0.6809, + "mean_token_accuracy": 0.7902523100376129, + "num_tokens": 186481110.0, + "step": 78960 + }, + { + "epoch": 0.7240304391675071, + "learning_rate": 5.5195745851288163e-05, + "loss": 0.6793, + "mean_token_accuracy": 0.7880862593650818, + "num_tokens": 186505364.0, + "step": 78970 + }, + { + "epoch": 0.7241221234069863, + "learning_rate": 5.517740900339232e-05, + "loss": 0.6652, + "mean_token_accuracy": 0.7870647728443145, + "num_tokens": 186530464.0, + "step": 78980 + }, + { + "epoch": 0.7242138076464656, + "learning_rate": 5.5159072155496474e-05, + "loss": 0.6807, + "mean_token_accuracy": 0.788888442516327, + "num_tokens": 186555351.0, + "step": 78990 + }, + { + "epoch": 0.7243054918859448, + "learning_rate": 5.514073530760062e-05, + "loss": 0.6564, + "mean_token_accuracy": 0.7987925112247467, + "num_tokens": 186580817.0, + "step": 79000 + }, + { + "epoch": 0.7243971761254241, + "learning_rate": 5.5122398459704785e-05, + "loss": 0.6549, + "mean_token_accuracy": 0.7931228756904602, + "num_tokens": 186605941.0, + "step": 79010 + }, + { + "epoch": 0.7244888603649032, + "learning_rate": 5.510406161180893e-05, + "loss": 0.6836, + "mean_token_accuracy": 0.7867121160030365, + "num_tokens": 186630863.0, + "step": 79020 + }, + { + "epoch": 0.7245805446043825, + "learning_rate": 5.508572476391308e-05, + "loss": 0.7233, + "mean_token_accuracy": 0.7841231107711792, + "num_tokens": 186656597.0, + "step": 79030 + }, + { + "epoch": 0.7246722288438617, + "learning_rate": 5.506738791601724e-05, + "loss": 0.6919, + "mean_token_accuracy": 0.7882936596870422, + "num_tokens": 186682475.0, + "step": 79040 + }, + { + "epoch": 0.724763913083341, + "learning_rate": 5.504905106812139e-05, + "loss": 0.6513, + "mean_token_accuracy": 0.7978208243846894, + "num_tokens": 186707856.0, + "step": 79050 + }, + { + "epoch": 0.7248555973228202, + "learning_rate": 5.5030714220225544e-05, + "loss": 0.6796, + "mean_token_accuracy": 0.7892354786396026, + "num_tokens": 186732330.0, + "step": 79060 + }, + { + "epoch": 0.7249472815622995, + "learning_rate": 5.50123773723297e-05, + "loss": 0.683, + "mean_token_accuracy": 0.7898118734359741, + "num_tokens": 186757324.0, + "step": 79070 + }, + { + "epoch": 0.7250389658017786, + "learning_rate": 5.4994040524433854e-05, + "loss": 0.6786, + "mean_token_accuracy": 0.7866646826267243, + "num_tokens": 186782426.0, + "step": 79080 + }, + { + "epoch": 0.7251306500412579, + "learning_rate": 5.4975703676538006e-05, + "loss": 0.6582, + "mean_token_accuracy": 0.7960130989551544, + "num_tokens": 186808127.0, + "step": 79090 + }, + { + "epoch": 0.7252223342807371, + "learning_rate": 5.495736682864215e-05, + "loss": 0.7164, + "mean_token_accuracy": 0.7812751412391663, + "num_tokens": 186833079.0, + "step": 79100 + }, + { + "epoch": 0.7253140185202164, + "learning_rate": 5.493902998074632e-05, + "loss": 0.6752, + "mean_token_accuracy": 0.7962970733642578, + "num_tokens": 186858565.0, + "step": 79110 + }, + { + "epoch": 0.7254057027596956, + "learning_rate": 5.492069313285046e-05, + "loss": 0.674, + "mean_token_accuracy": 0.7864541113376617, + "num_tokens": 186883852.0, + "step": 79120 + }, + { + "epoch": 0.7254973869991749, + "learning_rate": 5.4902356284954614e-05, + "loss": 0.6894, + "mean_token_accuracy": 0.7863449811935425, + "num_tokens": 186909679.0, + "step": 79130 + }, + { + "epoch": 0.7255890712386541, + "learning_rate": 5.488401943705877e-05, + "loss": 0.6794, + "mean_token_accuracy": 0.7928593873977661, + "num_tokens": 186934040.0, + "step": 79140 + }, + { + "epoch": 0.7256807554781333, + "learning_rate": 5.4865682589162924e-05, + "loss": 0.6579, + "mean_token_accuracy": 0.793781453371048, + "num_tokens": 186958758.0, + "step": 79150 + }, + { + "epoch": 0.7257724397176125, + "learning_rate": 5.4847345741267076e-05, + "loss": 0.6897, + "mean_token_accuracy": 0.7864092826843262, + "num_tokens": 186983248.0, + "step": 79160 + }, + { + "epoch": 0.7258641239570918, + "learning_rate": 5.4829008893371235e-05, + "loss": 0.6874, + "mean_token_accuracy": 0.7873319625854492, + "num_tokens": 187008200.0, + "step": 79170 + }, + { + "epoch": 0.725955808196571, + "learning_rate": 5.4810672045475387e-05, + "loss": 0.7107, + "mean_token_accuracy": 0.7863698482513428, + "num_tokens": 187033568.0, + "step": 79180 + }, + { + "epoch": 0.7260474924360503, + "learning_rate": 5.479233519757954e-05, + "loss": 0.6627, + "mean_token_accuracy": 0.7947986125946045, + "num_tokens": 187058239.0, + "step": 79190 + }, + { + "epoch": 0.7261391766755295, + "learning_rate": 5.47739983496837e-05, + "loss": 0.6536, + "mean_token_accuracy": 0.7928597748279571, + "num_tokens": 187083095.0, + "step": 79200 + }, + { + "epoch": 0.7262308609150087, + "learning_rate": 5.475566150178785e-05, + "loss": 0.6224, + "mean_token_accuracy": 0.8028665602207183, + "num_tokens": 187108524.0, + "step": 79210 + }, + { + "epoch": 0.7263225451544879, + "learning_rate": 5.4737324653891994e-05, + "loss": 0.653, + "mean_token_accuracy": 0.8016027867794037, + "num_tokens": 187133647.0, + "step": 79220 + }, + { + "epoch": 0.7264142293939672, + "learning_rate": 5.4718987805996146e-05, + "loss": 0.7373, + "mean_token_accuracy": 0.7745027780532837, + "num_tokens": 187158796.0, + "step": 79230 + }, + { + "epoch": 0.7265059136334464, + "learning_rate": 5.4700650958100305e-05, + "loss": 0.7257, + "mean_token_accuracy": 0.7769539535045624, + "num_tokens": 187183073.0, + "step": 79240 + }, + { + "epoch": 0.7265975978729257, + "learning_rate": 5.4682314110204456e-05, + "loss": 0.686, + "mean_token_accuracy": 0.7857530534267425, + "num_tokens": 187208311.0, + "step": 79250 + }, + { + "epoch": 0.7266892821124049, + "learning_rate": 5.466397726230861e-05, + "loss": 0.6749, + "mean_token_accuracy": 0.7894758582115173, + "num_tokens": 187233143.0, + "step": 79260 + }, + { + "epoch": 0.7267809663518842, + "learning_rate": 5.464564041441277e-05, + "loss": 0.6843, + "mean_token_accuracy": 0.7927349925041198, + "num_tokens": 187257810.0, + "step": 79270 + }, + { + "epoch": 0.7268726505913633, + "learning_rate": 5.462730356651692e-05, + "loss": 0.6607, + "mean_token_accuracy": 0.8018940210342407, + "num_tokens": 187283158.0, + "step": 79280 + }, + { + "epoch": 0.7269643348308426, + "learning_rate": 5.460896671862107e-05, + "loss": 0.6781, + "mean_token_accuracy": 0.7852358162403107, + "num_tokens": 187308925.0, + "step": 79290 + }, + { + "epoch": 0.7270560190703218, + "learning_rate": 5.459062987072523e-05, + "loss": 0.6915, + "mean_token_accuracy": 0.7866684913635253, + "num_tokens": 187333988.0, + "step": 79300 + }, + { + "epoch": 0.727147703309801, + "learning_rate": 5.457229302282938e-05, + "loss": 0.6616, + "mean_token_accuracy": 0.7948778569698334, + "num_tokens": 187358668.0, + "step": 79310 + }, + { + "epoch": 0.7272393875492803, + "learning_rate": 5.4553956174933526e-05, + "loss": 0.6912, + "mean_token_accuracy": 0.7864884972572327, + "num_tokens": 187383966.0, + "step": 79320 + }, + { + "epoch": 0.7273310717887596, + "learning_rate": 5.453561932703769e-05, + "loss": 0.6864, + "mean_token_accuracy": 0.7897108733654022, + "num_tokens": 187409724.0, + "step": 79330 + }, + { + "epoch": 0.7274227560282387, + "learning_rate": 5.451728247914184e-05, + "loss": 0.6758, + "mean_token_accuracy": 0.7939182937145233, + "num_tokens": 187434764.0, + "step": 79340 + }, + { + "epoch": 0.7275144402677179, + "learning_rate": 5.449894563124599e-05, + "loss": 0.6694, + "mean_token_accuracy": 0.7932112634181976, + "num_tokens": 187459904.0, + "step": 79350 + }, + { + "epoch": 0.7276061245071972, + "learning_rate": 5.448060878335014e-05, + "loss": 0.6839, + "mean_token_accuracy": 0.7892306923866272, + "num_tokens": 187484285.0, + "step": 79360 + }, + { + "epoch": 0.7276978087466764, + "learning_rate": 5.44622719354543e-05, + "loss": 0.6938, + "mean_token_accuracy": 0.7868093073368072, + "num_tokens": 187508917.0, + "step": 79370 + }, + { + "epoch": 0.7277894929861557, + "learning_rate": 5.444393508755845e-05, + "loss": 0.6741, + "mean_token_accuracy": 0.7889336228370667, + "num_tokens": 187533158.0, + "step": 79380 + }, + { + "epoch": 0.727881177225635, + "learning_rate": 5.44255982396626e-05, + "loss": 0.6848, + "mean_token_accuracy": 0.7920760989189148, + "num_tokens": 187558298.0, + "step": 79390 + }, + { + "epoch": 0.7279728614651142, + "learning_rate": 5.440726139176676e-05, + "loss": 0.699, + "mean_token_accuracy": 0.786843329668045, + "num_tokens": 187582384.0, + "step": 79400 + }, + { + "epoch": 0.7280645457045933, + "learning_rate": 5.4388924543870913e-05, + "loss": 0.6537, + "mean_token_accuracy": 0.7969779133796692, + "num_tokens": 187606863.0, + "step": 79410 + }, + { + "epoch": 0.7281562299440726, + "learning_rate": 5.437058769597506e-05, + "loss": 0.6615, + "mean_token_accuracy": 0.7937743186950683, + "num_tokens": 187631978.0, + "step": 79420 + }, + { + "epoch": 0.7282479141835518, + "learning_rate": 5.4352250848079224e-05, + "loss": 0.6863, + "mean_token_accuracy": 0.788418835401535, + "num_tokens": 187657222.0, + "step": 79430 + }, + { + "epoch": 0.7283395984230311, + "learning_rate": 5.433391400018337e-05, + "loss": 0.6521, + "mean_token_accuracy": 0.7989540219306945, + "num_tokens": 187682955.0, + "step": 79440 + }, + { + "epoch": 0.7284312826625103, + "learning_rate": 5.431557715228752e-05, + "loss": 0.6683, + "mean_token_accuracy": 0.7878883302211761, + "num_tokens": 187708001.0, + "step": 79450 + }, + { + "epoch": 0.7285229669019896, + "learning_rate": 5.429724030439167e-05, + "loss": 0.6394, + "mean_token_accuracy": 0.8020074605941773, + "num_tokens": 187733155.0, + "step": 79460 + }, + { + "epoch": 0.7286146511414687, + "learning_rate": 5.427890345649583e-05, + "loss": 0.675, + "mean_token_accuracy": 0.7911485075950623, + "num_tokens": 187757810.0, + "step": 79470 + }, + { + "epoch": 0.728706335380948, + "learning_rate": 5.426056660859998e-05, + "loss": 0.6423, + "mean_token_accuracy": 0.8018137454986572, + "num_tokens": 187783479.0, + "step": 79480 + }, + { + "epoch": 0.7287980196204272, + "learning_rate": 5.4242229760704135e-05, + "loss": 0.7191, + "mean_token_accuracy": 0.7751696288585663, + "num_tokens": 187808545.0, + "step": 79490 + }, + { + "epoch": 0.7288897038599065, + "learning_rate": 5.4223892912808294e-05, + "loss": 0.678, + "mean_token_accuracy": 0.7919573366641999, + "num_tokens": 187832865.0, + "step": 79500 + }, + { + "epoch": 0.7289813880993857, + "learning_rate": 5.4205556064912446e-05, + "loss": 0.6883, + "mean_token_accuracy": 0.7857295870780945, + "num_tokens": 187858257.0, + "step": 79510 + }, + { + "epoch": 0.729073072338865, + "learning_rate": 5.418721921701659e-05, + "loss": 0.7078, + "mean_token_accuracy": 0.7824679374694824, + "num_tokens": 187883762.0, + "step": 79520 + }, + { + "epoch": 0.7291647565783442, + "learning_rate": 5.4168882369120756e-05, + "loss": 0.6654, + "mean_token_accuracy": 0.7948396861553192, + "num_tokens": 187909411.0, + "step": 79530 + }, + { + "epoch": 0.7292564408178234, + "learning_rate": 5.415054552122491e-05, + "loss": 0.6835, + "mean_token_accuracy": 0.7936994552612304, + "num_tokens": 187934935.0, + "step": 79540 + }, + { + "epoch": 0.7293481250573026, + "learning_rate": 5.413220867332905e-05, + "loss": 0.6583, + "mean_token_accuracy": 0.7967337548732758, + "num_tokens": 187960807.0, + "step": 79550 + }, + { + "epoch": 0.7294398092967819, + "learning_rate": 5.411387182543322e-05, + "loss": 0.7154, + "mean_token_accuracy": 0.7844775915145874, + "num_tokens": 187985519.0, + "step": 79560 + }, + { + "epoch": 0.7295314935362611, + "learning_rate": 5.4095534977537364e-05, + "loss": 0.6693, + "mean_token_accuracy": 0.7947754561901093, + "num_tokens": 188010595.0, + "step": 79570 + }, + { + "epoch": 0.7296231777757404, + "learning_rate": 5.4077198129641516e-05, + "loss": 0.6715, + "mean_token_accuracy": 0.7909493327140809, + "num_tokens": 188035749.0, + "step": 79580 + }, + { + "epoch": 0.7297148620152196, + "learning_rate": 5.405886128174567e-05, + "loss": 0.6849, + "mean_token_accuracy": 0.7898952901363373, + "num_tokens": 188061378.0, + "step": 79590 + }, + { + "epoch": 0.7298065462546988, + "learning_rate": 5.4040524433849826e-05, + "loss": 0.6771, + "mean_token_accuracy": 0.7913882613182068, + "num_tokens": 188085486.0, + "step": 79600 + }, + { + "epoch": 0.729898230494178, + "learning_rate": 5.402218758595398e-05, + "loss": 0.6478, + "mean_token_accuracy": 0.7929193317890167, + "num_tokens": 188110385.0, + "step": 79610 + }, + { + "epoch": 0.7299899147336573, + "learning_rate": 5.400385073805812e-05, + "loss": 0.6686, + "mean_token_accuracy": 0.7889566123485565, + "num_tokens": 188136078.0, + "step": 79620 + }, + { + "epoch": 0.7300815989731365, + "learning_rate": 5.398551389016229e-05, + "loss": 0.6699, + "mean_token_accuracy": 0.7939992249011993, + "num_tokens": 188162378.0, + "step": 79630 + }, + { + "epoch": 0.7301732832126158, + "learning_rate": 5.396717704226644e-05, + "loss": 0.6702, + "mean_token_accuracy": 0.7892761111259461, + "num_tokens": 188187023.0, + "step": 79640 + }, + { + "epoch": 0.730264967452095, + "learning_rate": 5.3948840194370585e-05, + "loss": 0.6937, + "mean_token_accuracy": 0.7890453279018402, + "num_tokens": 188211766.0, + "step": 79650 + }, + { + "epoch": 0.7303566516915743, + "learning_rate": 5.393050334647475e-05, + "loss": 0.6807, + "mean_token_accuracy": 0.7881542801856994, + "num_tokens": 188237641.0, + "step": 79660 + }, + { + "epoch": 0.7304483359310534, + "learning_rate": 5.3912166498578896e-05, + "loss": 0.7006, + "mean_token_accuracy": 0.7916547179222106, + "num_tokens": 188262338.0, + "step": 79670 + }, + { + "epoch": 0.7305400201705327, + "learning_rate": 5.389382965068305e-05, + "loss": 0.6598, + "mean_token_accuracy": 0.795462167263031, + "num_tokens": 188288257.0, + "step": 79680 + }, + { + "epoch": 0.7306317044100119, + "learning_rate": 5.3875492802787206e-05, + "loss": 0.6559, + "mean_token_accuracy": 0.7956127762794495, + "num_tokens": 188313085.0, + "step": 79690 + }, + { + "epoch": 0.7307233886494912, + "learning_rate": 5.385715595489136e-05, + "loss": 0.7098, + "mean_token_accuracy": 0.7878253340721131, + "num_tokens": 188337592.0, + "step": 79700 + }, + { + "epoch": 0.7308150728889704, + "learning_rate": 5.383881910699551e-05, + "loss": 0.6787, + "mean_token_accuracy": 0.7885228514671325, + "num_tokens": 188363528.0, + "step": 79710 + }, + { + "epoch": 0.7309067571284497, + "learning_rate": 5.3820482259099655e-05, + "loss": 0.6931, + "mean_token_accuracy": 0.7864165544509888, + "num_tokens": 188389037.0, + "step": 79720 + }, + { + "epoch": 0.7309984413679289, + "learning_rate": 5.380214541120382e-05, + "loss": 0.6835, + "mean_token_accuracy": 0.7906298160552978, + "num_tokens": 188413023.0, + "step": 79730 + }, + { + "epoch": 0.731090125607408, + "learning_rate": 5.378380856330797e-05, + "loss": 0.7135, + "mean_token_accuracy": 0.7800632536411285, + "num_tokens": 188438215.0, + "step": 79740 + }, + { + "epoch": 0.7311818098468873, + "learning_rate": 5.376547171541212e-05, + "loss": 0.6874, + "mean_token_accuracy": 0.7926500022411347, + "num_tokens": 188463977.0, + "step": 79750 + }, + { + "epoch": 0.7312734940863665, + "learning_rate": 5.374713486751628e-05, + "loss": 0.6831, + "mean_token_accuracy": 0.7888989210128784, + "num_tokens": 188488445.0, + "step": 79760 + }, + { + "epoch": 0.7313651783258458, + "learning_rate": 5.372879801962043e-05, + "loss": 0.6517, + "mean_token_accuracy": 0.7938899755477905, + "num_tokens": 188513727.0, + "step": 79770 + }, + { + "epoch": 0.731456862565325, + "learning_rate": 5.371046117172458e-05, + "loss": 0.6637, + "mean_token_accuracy": 0.7909485876560212, + "num_tokens": 188539201.0, + "step": 79780 + }, + { + "epoch": 0.7315485468048043, + "learning_rate": 5.369212432382874e-05, + "loss": 0.6688, + "mean_token_accuracy": 0.7948606193065644, + "num_tokens": 188563571.0, + "step": 79790 + }, + { + "epoch": 0.7316402310442834, + "learning_rate": 5.367378747593289e-05, + "loss": 0.6606, + "mean_token_accuracy": 0.7913779854774475, + "num_tokens": 188588312.0, + "step": 79800 + }, + { + "epoch": 0.7317319152837627, + "learning_rate": 5.365545062803704e-05, + "loss": 0.6624, + "mean_token_accuracy": 0.7969732344150543, + "num_tokens": 188613882.0, + "step": 79810 + }, + { + "epoch": 0.7318235995232419, + "learning_rate": 5.36371137801412e-05, + "loss": 0.6948, + "mean_token_accuracy": 0.7828238844871521, + "num_tokens": 188639571.0, + "step": 79820 + }, + { + "epoch": 0.7319152837627212, + "learning_rate": 5.361877693224535e-05, + "loss": 0.6649, + "mean_token_accuracy": 0.7942383110523223, + "num_tokens": 188664226.0, + "step": 79830 + }, + { + "epoch": 0.7320069680022004, + "learning_rate": 5.3600440084349505e-05, + "loss": 0.6544, + "mean_token_accuracy": 0.7965122163295746, + "num_tokens": 188689153.0, + "step": 79840 + }, + { + "epoch": 0.7320986522416797, + "learning_rate": 5.358210323645365e-05, + "loss": 0.677, + "mean_token_accuracy": 0.7880686104297638, + "num_tokens": 188714115.0, + "step": 79850 + }, + { + "epoch": 0.7321903364811589, + "learning_rate": 5.3563766388557815e-05, + "loss": 0.7405, + "mean_token_accuracy": 0.7743090927600861, + "num_tokens": 188739708.0, + "step": 79860 + }, + { + "epoch": 0.7322820207206381, + "learning_rate": 5.354542954066196e-05, + "loss": 0.6461, + "mean_token_accuracy": 0.7960841357707977, + "num_tokens": 188765488.0, + "step": 79870 + }, + { + "epoch": 0.7323737049601173, + "learning_rate": 5.352709269276611e-05, + "loss": 0.6588, + "mean_token_accuracy": 0.7978433609008789, + "num_tokens": 188790052.0, + "step": 79880 + }, + { + "epoch": 0.7324653891995966, + "learning_rate": 5.350875584487027e-05, + "loss": 0.7014, + "mean_token_accuracy": 0.7835223853588105, + "num_tokens": 188815253.0, + "step": 79890 + }, + { + "epoch": 0.7325570734390758, + "learning_rate": 5.349041899697442e-05, + "loss": 0.6699, + "mean_token_accuracy": 0.7923356831073761, + "num_tokens": 188840657.0, + "step": 79900 + }, + { + "epoch": 0.7326487576785551, + "learning_rate": 5.3472082149078575e-05, + "loss": 0.6786, + "mean_token_accuracy": 0.7936592340469361, + "num_tokens": 188866276.0, + "step": 79910 + }, + { + "epoch": 0.7327404419180343, + "learning_rate": 5.345374530118273e-05, + "loss": 0.6856, + "mean_token_accuracy": 0.7864917993545533, + "num_tokens": 188891612.0, + "step": 79920 + }, + { + "epoch": 0.7328321261575135, + "learning_rate": 5.3435408453286885e-05, + "loss": 0.636, + "mean_token_accuracy": 0.8033297240734101, + "num_tokens": 188917104.0, + "step": 79930 + }, + { + "epoch": 0.7329238103969927, + "learning_rate": 5.341707160539104e-05, + "loss": 0.6569, + "mean_token_accuracy": 0.7944091916084289, + "num_tokens": 188941870.0, + "step": 79940 + }, + { + "epoch": 0.733015494636472, + "learning_rate": 5.3398734757495196e-05, + "loss": 0.6729, + "mean_token_accuracy": 0.7910976231098175, + "num_tokens": 188966674.0, + "step": 79950 + }, + { + "epoch": 0.7331071788759512, + "learning_rate": 5.338039790959935e-05, + "loss": 0.6593, + "mean_token_accuracy": 0.7933946967124939, + "num_tokens": 188992114.0, + "step": 79960 + }, + { + "epoch": 0.7331988631154305, + "learning_rate": 5.336206106170349e-05, + "loss": 0.6451, + "mean_token_accuracy": 0.8009393155574799, + "num_tokens": 189017131.0, + "step": 79970 + }, + { + "epoch": 0.7332905473549097, + "learning_rate": 5.3343724213807644e-05, + "loss": 0.6532, + "mean_token_accuracy": 0.7954998254776001, + "num_tokens": 189041900.0, + "step": 79980 + }, + { + "epoch": 0.733382231594389, + "learning_rate": 5.33253873659118e-05, + "loss": 0.7007, + "mean_token_accuracy": 0.7831595361232757, + "num_tokens": 189066439.0, + "step": 79990 + }, + { + "epoch": 0.7334739158338681, + "learning_rate": 5.3307050518015955e-05, + "loss": 0.675, + "mean_token_accuracy": 0.7911353826522827, + "num_tokens": 189091733.0, + "step": 80000 + }, + { + "epoch": 0.7335656000733474, + "learning_rate": 5.328871367012011e-05, + "loss": 0.6725, + "mean_token_accuracy": 0.7923921167850494, + "num_tokens": 189117742.0, + "step": 80010 + }, + { + "epoch": 0.7336572843128266, + "learning_rate": 5.3270376822224265e-05, + "loss": 0.6875, + "mean_token_accuracy": 0.7831376135349274, + "num_tokens": 189143435.0, + "step": 80020 + }, + { + "epoch": 0.7337489685523059, + "learning_rate": 5.325203997432842e-05, + "loss": 0.7023, + "mean_token_accuracy": 0.7888618469238281, + "num_tokens": 189168928.0, + "step": 80030 + }, + { + "epoch": 0.7338406527917851, + "learning_rate": 5.323370312643257e-05, + "loss": 0.6345, + "mean_token_accuracy": 0.801346880197525, + "num_tokens": 189194610.0, + "step": 80040 + }, + { + "epoch": 0.7339323370312644, + "learning_rate": 5.321536627853673e-05, + "loss": 0.7002, + "mean_token_accuracy": 0.7882979094982148, + "num_tokens": 189219652.0, + "step": 80050 + }, + { + "epoch": 0.7340240212707435, + "learning_rate": 5.319702943064088e-05, + "loss": 0.6795, + "mean_token_accuracy": 0.7905156254768372, + "num_tokens": 189244274.0, + "step": 80060 + }, + { + "epoch": 0.7341157055102228, + "learning_rate": 5.3178692582745025e-05, + "loss": 0.6471, + "mean_token_accuracy": 0.8073345959186554, + "num_tokens": 189269626.0, + "step": 80070 + }, + { + "epoch": 0.734207389749702, + "learning_rate": 5.316035573484918e-05, + "loss": 0.6737, + "mean_token_accuracy": 0.792496246099472, + "num_tokens": 189295147.0, + "step": 80080 + }, + { + "epoch": 0.7342990739891813, + "learning_rate": 5.3142018886953335e-05, + "loss": 0.6483, + "mean_token_accuracy": 0.7981096088886261, + "num_tokens": 189320059.0, + "step": 80090 + }, + { + "epoch": 0.7343907582286605, + "learning_rate": 5.312368203905749e-05, + "loss": 0.6817, + "mean_token_accuracy": 0.7924897193908691, + "num_tokens": 189346014.0, + "step": 80100 + }, + { + "epoch": 0.7344824424681398, + "learning_rate": 5.310534519116164e-05, + "loss": 0.6588, + "mean_token_accuracy": 0.7879400074481964, + "num_tokens": 189370992.0, + "step": 80110 + }, + { + "epoch": 0.734574126707619, + "learning_rate": 5.30870083432658e-05, + "loss": 0.6527, + "mean_token_accuracy": 0.7944809854030609, + "num_tokens": 189395670.0, + "step": 80120 + }, + { + "epoch": 0.7346658109470982, + "learning_rate": 5.306867149536995e-05, + "loss": 0.677, + "mean_token_accuracy": 0.7863703429698944, + "num_tokens": 189420540.0, + "step": 80130 + }, + { + "epoch": 0.7347574951865774, + "learning_rate": 5.30503346474741e-05, + "loss": 0.6632, + "mean_token_accuracy": 0.7973880887031555, + "num_tokens": 189445936.0, + "step": 80140 + }, + { + "epoch": 0.7348491794260567, + "learning_rate": 5.303199779957826e-05, + "loss": 0.7363, + "mean_token_accuracy": 0.7791323900222779, + "num_tokens": 189470074.0, + "step": 80150 + }, + { + "epoch": 0.7349408636655359, + "learning_rate": 5.301366095168241e-05, + "loss": 0.6967, + "mean_token_accuracy": 0.780820369720459, + "num_tokens": 189495225.0, + "step": 80160 + }, + { + "epoch": 0.7350325479050152, + "learning_rate": 5.299532410378656e-05, + "loss": 0.6859, + "mean_token_accuracy": 0.7911755859851837, + "num_tokens": 189520377.0, + "step": 80170 + }, + { + "epoch": 0.7351242321444944, + "learning_rate": 5.297698725589072e-05, + "loss": 0.6969, + "mean_token_accuracy": 0.7861814081668854, + "num_tokens": 189545211.0, + "step": 80180 + }, + { + "epoch": 0.7352159163839735, + "learning_rate": 5.295865040799487e-05, + "loss": 0.7017, + "mean_token_accuracy": 0.7866884708404541, + "num_tokens": 189569528.0, + "step": 80190 + }, + { + "epoch": 0.7353076006234528, + "learning_rate": 5.294031356009902e-05, + "loss": 0.656, + "mean_token_accuracy": 0.7965950012207031, + "num_tokens": 189593828.0, + "step": 80200 + }, + { + "epoch": 0.735399284862932, + "learning_rate": 5.292197671220317e-05, + "loss": 0.6496, + "mean_token_accuracy": 0.7972586572170257, + "num_tokens": 189619342.0, + "step": 80210 + }, + { + "epoch": 0.7354909691024113, + "learning_rate": 5.290363986430733e-05, + "loss": 0.6844, + "mean_token_accuracy": 0.7861582815647126, + "num_tokens": 189644553.0, + "step": 80220 + }, + { + "epoch": 0.7355826533418905, + "learning_rate": 5.288530301641148e-05, + "loss": 0.6955, + "mean_token_accuracy": 0.789175671339035, + "num_tokens": 189669080.0, + "step": 80230 + }, + { + "epoch": 0.7356743375813698, + "learning_rate": 5.2866966168515634e-05, + "loss": 0.7158, + "mean_token_accuracy": 0.7790573120117188, + "num_tokens": 189693329.0, + "step": 80240 + }, + { + "epoch": 0.735766021820849, + "learning_rate": 5.284862932061979e-05, + "loss": 0.6777, + "mean_token_accuracy": 0.7848819613456726, + "num_tokens": 189718376.0, + "step": 80250 + }, + { + "epoch": 0.7358577060603282, + "learning_rate": 5.2830292472723944e-05, + "loss": 0.685, + "mean_token_accuracy": 0.7896092176437378, + "num_tokens": 189743345.0, + "step": 80260 + }, + { + "epoch": 0.7359493902998074, + "learning_rate": 5.281195562482809e-05, + "loss": 0.7118, + "mean_token_accuracy": 0.7788365304470062, + "num_tokens": 189768513.0, + "step": 80270 + }, + { + "epoch": 0.7360410745392867, + "learning_rate": 5.2793618776932255e-05, + "loss": 0.6942, + "mean_token_accuracy": 0.7790515959262848, + "num_tokens": 189792843.0, + "step": 80280 + }, + { + "epoch": 0.7361327587787659, + "learning_rate": 5.27752819290364e-05, + "loss": 0.6719, + "mean_token_accuracy": 0.7966277360916137, + "num_tokens": 189817526.0, + "step": 80290 + }, + { + "epoch": 0.7362244430182452, + "learning_rate": 5.275694508114055e-05, + "loss": 0.6863, + "mean_token_accuracy": 0.7920669257640839, + "num_tokens": 189842854.0, + "step": 80300 + }, + { + "epoch": 0.7363161272577244, + "learning_rate": 5.273860823324471e-05, + "loss": 0.6438, + "mean_token_accuracy": 0.7960306406021118, + "num_tokens": 189867998.0, + "step": 80310 + }, + { + "epoch": 0.7364078114972036, + "learning_rate": 5.272027138534886e-05, + "loss": 0.675, + "mean_token_accuracy": 0.7901750206947327, + "num_tokens": 189893032.0, + "step": 80320 + }, + { + "epoch": 0.7364994957366828, + "learning_rate": 5.2701934537453014e-05, + "loss": 0.6655, + "mean_token_accuracy": 0.7903243482112885, + "num_tokens": 189917930.0, + "step": 80330 + }, + { + "epoch": 0.7365911799761621, + "learning_rate": 5.2683597689557166e-05, + "loss": 0.6882, + "mean_token_accuracy": 0.7891256392002106, + "num_tokens": 189942763.0, + "step": 80340 + }, + { + "epoch": 0.7366828642156413, + "learning_rate": 5.2665260841661324e-05, + "loss": 0.6675, + "mean_token_accuracy": 0.7998230636119843, + "num_tokens": 189968362.0, + "step": 80350 + }, + { + "epoch": 0.7367745484551206, + "learning_rate": 5.2646923993765476e-05, + "loss": 0.6689, + "mean_token_accuracy": 0.7921317398548127, + "num_tokens": 189994107.0, + "step": 80360 + }, + { + "epoch": 0.7368662326945998, + "learning_rate": 5.262858714586962e-05, + "loss": 0.6829, + "mean_token_accuracy": 0.7936067163944245, + "num_tokens": 190019056.0, + "step": 80370 + }, + { + "epoch": 0.7369579169340791, + "learning_rate": 5.261025029797379e-05, + "loss": 0.6836, + "mean_token_accuracy": 0.7922172784805298, + "num_tokens": 190044149.0, + "step": 80380 + }, + { + "epoch": 0.7370496011735582, + "learning_rate": 5.259191345007793e-05, + "loss": 0.726, + "mean_token_accuracy": 0.783193153142929, + "num_tokens": 190069332.0, + "step": 80390 + }, + { + "epoch": 0.7371412854130375, + "learning_rate": 5.2573576602182084e-05, + "loss": 0.6944, + "mean_token_accuracy": 0.7866541266441345, + "num_tokens": 190095058.0, + "step": 80400 + }, + { + "epoch": 0.7372329696525167, + "learning_rate": 5.255523975428624e-05, + "loss": 0.7162, + "mean_token_accuracy": 0.7798259079456329, + "num_tokens": 190119728.0, + "step": 80410 + }, + { + "epoch": 0.737324653891996, + "learning_rate": 5.2536902906390394e-05, + "loss": 0.6717, + "mean_token_accuracy": 0.7873007714748382, + "num_tokens": 190145020.0, + "step": 80420 + }, + { + "epoch": 0.7374163381314752, + "learning_rate": 5.2518566058494546e-05, + "loss": 0.6984, + "mean_token_accuracy": 0.7886401295661927, + "num_tokens": 190169938.0, + "step": 80430 + }, + { + "epoch": 0.7375080223709545, + "learning_rate": 5.2500229210598705e-05, + "loss": 0.6665, + "mean_token_accuracy": 0.7915529727935791, + "num_tokens": 190195735.0, + "step": 80440 + }, + { + "epoch": 0.7375997066104336, + "learning_rate": 5.248189236270286e-05, + "loss": 0.6613, + "mean_token_accuracy": 0.7929513573646545, + "num_tokens": 190221335.0, + "step": 80450 + }, + { + "epoch": 0.7376913908499129, + "learning_rate": 5.246355551480701e-05, + "loss": 0.6916, + "mean_token_accuracy": 0.7865171432495117, + "num_tokens": 190247419.0, + "step": 80460 + }, + { + "epoch": 0.7377830750893921, + "learning_rate": 5.2445218666911154e-05, + "loss": 0.6701, + "mean_token_accuracy": 0.7929346561431885, + "num_tokens": 190272489.0, + "step": 80470 + }, + { + "epoch": 0.7378747593288714, + "learning_rate": 5.242688181901532e-05, + "loss": 0.6675, + "mean_token_accuracy": 0.7921228289604187, + "num_tokens": 190297713.0, + "step": 80480 + }, + { + "epoch": 0.7379664435683506, + "learning_rate": 5.2408544971119464e-05, + "loss": 0.7003, + "mean_token_accuracy": 0.7888290166854859, + "num_tokens": 190322807.0, + "step": 80490 + }, + { + "epoch": 0.7380581278078299, + "learning_rate": 5.2390208123223616e-05, + "loss": 0.6652, + "mean_token_accuracy": 0.794892543554306, + "num_tokens": 190347267.0, + "step": 80500 + }, + { + "epoch": 0.7381498120473091, + "learning_rate": 5.2371871275327775e-05, + "loss": 0.702, + "mean_token_accuracy": 0.7819541871547699, + "num_tokens": 190372358.0, + "step": 80510 + }, + { + "epoch": 0.7382414962867883, + "learning_rate": 5.2353534427431927e-05, + "loss": 0.6504, + "mean_token_accuracy": 0.7943321585655212, + "num_tokens": 190397426.0, + "step": 80520 + }, + { + "epoch": 0.7383331805262675, + "learning_rate": 5.233519757953608e-05, + "loss": 0.6846, + "mean_token_accuracy": 0.7873305916786194, + "num_tokens": 190422588.0, + "step": 80530 + }, + { + "epoch": 0.7384248647657468, + "learning_rate": 5.231686073164024e-05, + "loss": 0.634, + "mean_token_accuracy": 0.7992035388946533, + "num_tokens": 190448233.0, + "step": 80540 + }, + { + "epoch": 0.738516549005226, + "learning_rate": 5.229852388374439e-05, + "loss": 0.6922, + "mean_token_accuracy": 0.7892242312431336, + "num_tokens": 190473498.0, + "step": 80550 + }, + { + "epoch": 0.7386082332447053, + "learning_rate": 5.228018703584854e-05, + "loss": 0.7053, + "mean_token_accuracy": 0.7846129417419434, + "num_tokens": 190499721.0, + "step": 80560 + }, + { + "epoch": 0.7386999174841845, + "learning_rate": 5.22618501879527e-05, + "loss": 0.6695, + "mean_token_accuracy": 0.7938514113426208, + "num_tokens": 190524438.0, + "step": 80570 + }, + { + "epoch": 0.7387916017236636, + "learning_rate": 5.224351334005685e-05, + "loss": 0.6859, + "mean_token_accuracy": 0.7834884047508239, + "num_tokens": 190549560.0, + "step": 80580 + }, + { + "epoch": 0.7388832859631429, + "learning_rate": 5.2225176492160996e-05, + "loss": 0.6764, + "mean_token_accuracy": 0.79319748878479, + "num_tokens": 190574271.0, + "step": 80590 + }, + { + "epoch": 0.7389749702026222, + "learning_rate": 5.220683964426515e-05, + "loss": 0.6765, + "mean_token_accuracy": 0.7932425737380981, + "num_tokens": 190599548.0, + "step": 80600 + }, + { + "epoch": 0.7390666544421014, + "learning_rate": 5.218850279636931e-05, + "loss": 0.6879, + "mean_token_accuracy": 0.7921907782554627, + "num_tokens": 190625290.0, + "step": 80610 + }, + { + "epoch": 0.7391583386815807, + "learning_rate": 5.217016594847346e-05, + "loss": 0.6744, + "mean_token_accuracy": 0.789624297618866, + "num_tokens": 190649458.0, + "step": 80620 + }, + { + "epoch": 0.7392500229210599, + "learning_rate": 5.215182910057761e-05, + "loss": 0.6833, + "mean_token_accuracy": 0.7908877253532409, + "num_tokens": 190674600.0, + "step": 80630 + }, + { + "epoch": 0.7393417071605392, + "learning_rate": 5.213349225268177e-05, + "loss": 0.6692, + "mean_token_accuracy": 0.7917872250080109, + "num_tokens": 190699891.0, + "step": 80640 + }, + { + "epoch": 0.7394333914000183, + "learning_rate": 5.211515540478592e-05, + "loss": 0.6839, + "mean_token_accuracy": 0.7962104916572571, + "num_tokens": 190724105.0, + "step": 80650 + }, + { + "epoch": 0.7395250756394975, + "learning_rate": 5.209681855689007e-05, + "loss": 0.6819, + "mean_token_accuracy": 0.7885459780693054, + "num_tokens": 190749063.0, + "step": 80660 + }, + { + "epoch": 0.7396167598789768, + "learning_rate": 5.207848170899423e-05, + "loss": 0.6524, + "mean_token_accuracy": 0.8003826260566711, + "num_tokens": 190773615.0, + "step": 80670 + }, + { + "epoch": 0.739708444118456, + "learning_rate": 5.2060144861098384e-05, + "loss": 0.6866, + "mean_token_accuracy": 0.7876509904861451, + "num_tokens": 190799197.0, + "step": 80680 + }, + { + "epoch": 0.7398001283579353, + "learning_rate": 5.204180801320253e-05, + "loss": 0.6871, + "mean_token_accuracy": 0.7913267910480499, + "num_tokens": 190824244.0, + "step": 80690 + }, + { + "epoch": 0.7398918125974145, + "learning_rate": 5.202347116530668e-05, + "loss": 0.7032, + "mean_token_accuracy": 0.7855749905109406, + "num_tokens": 190848853.0, + "step": 80700 + }, + { + "epoch": 0.7399834968368937, + "learning_rate": 5.200513431741084e-05, + "loss": 0.6792, + "mean_token_accuracy": 0.7900627136230469, + "num_tokens": 190874001.0, + "step": 80710 + }, + { + "epoch": 0.7400751810763729, + "learning_rate": 5.198679746951499e-05, + "loss": 0.6745, + "mean_token_accuracy": 0.7865762948989868, + "num_tokens": 190899139.0, + "step": 80720 + }, + { + "epoch": 0.7401668653158522, + "learning_rate": 5.196846062161914e-05, + "loss": 0.6584, + "mean_token_accuracy": 0.7981809079647064, + "num_tokens": 190924074.0, + "step": 80730 + }, + { + "epoch": 0.7402585495553314, + "learning_rate": 5.19501237737233e-05, + "loss": 0.6772, + "mean_token_accuracy": 0.7952097833156586, + "num_tokens": 190949958.0, + "step": 80740 + }, + { + "epoch": 0.7403502337948107, + "learning_rate": 5.1931786925827453e-05, + "loss": 0.7061, + "mean_token_accuracy": 0.7916275203227997, + "num_tokens": 190975420.0, + "step": 80750 + }, + { + "epoch": 0.7404419180342899, + "learning_rate": 5.1913450077931605e-05, + "loss": 0.6635, + "mean_token_accuracy": 0.7918824315071106, + "num_tokens": 191000167.0, + "step": 80760 + }, + { + "epoch": 0.7405336022737692, + "learning_rate": 5.1895113230035764e-05, + "loss": 0.6711, + "mean_token_accuracy": 0.7908523559570313, + "num_tokens": 191024939.0, + "step": 80770 + }, + { + "epoch": 0.7406252865132483, + "learning_rate": 5.1876776382139916e-05, + "loss": 0.667, + "mean_token_accuracy": 0.8000496864318848, + "num_tokens": 191050622.0, + "step": 80780 + }, + { + "epoch": 0.7407169707527276, + "learning_rate": 5.185843953424406e-05, + "loss": 0.626, + "mean_token_accuracy": 0.8028790414333343, + "num_tokens": 191076075.0, + "step": 80790 + }, + { + "epoch": 0.7408086549922068, + "learning_rate": 5.1840102686348226e-05, + "loss": 0.7181, + "mean_token_accuracy": 0.7822464406490326, + "num_tokens": 191101571.0, + "step": 80800 + }, + { + "epoch": 0.7409003392316861, + "learning_rate": 5.182176583845237e-05, + "loss": 0.6393, + "mean_token_accuracy": 0.800845468044281, + "num_tokens": 191126630.0, + "step": 80810 + }, + { + "epoch": 0.7409920234711653, + "learning_rate": 5.180342899055652e-05, + "loss": 0.6678, + "mean_token_accuracy": 0.7918784499168396, + "num_tokens": 191151715.0, + "step": 80820 + }, + { + "epoch": 0.7410837077106446, + "learning_rate": 5.1785092142660675e-05, + "loss": 0.6951, + "mean_token_accuracy": 0.7841989398002625, + "num_tokens": 191176017.0, + "step": 80830 + }, + { + "epoch": 0.7411753919501237, + "learning_rate": 5.1766755294764834e-05, + "loss": 0.6798, + "mean_token_accuracy": 0.7880084216594696, + "num_tokens": 191201586.0, + "step": 80840 + }, + { + "epoch": 0.741267076189603, + "learning_rate": 5.1748418446868986e-05, + "loss": 0.6921, + "mean_token_accuracy": 0.7903082966804504, + "num_tokens": 191225840.0, + "step": 80850 + }, + { + "epoch": 0.7413587604290822, + "learning_rate": 5.173008159897314e-05, + "loss": 0.7165, + "mean_token_accuracy": 0.7847334921360016, + "num_tokens": 191251739.0, + "step": 80860 + }, + { + "epoch": 0.7414504446685615, + "learning_rate": 5.1711744751077296e-05, + "loss": 0.6817, + "mean_token_accuracy": 0.787997943162918, + "num_tokens": 191276880.0, + "step": 80870 + }, + { + "epoch": 0.7415421289080407, + "learning_rate": 5.169340790318145e-05, + "loss": 0.6506, + "mean_token_accuracy": 0.7952578723430633, + "num_tokens": 191302208.0, + "step": 80880 + }, + { + "epoch": 0.74163381314752, + "learning_rate": 5.167507105528559e-05, + "loss": 0.6663, + "mean_token_accuracy": 0.7942912399768829, + "num_tokens": 191327867.0, + "step": 80890 + }, + { + "epoch": 0.7417254973869992, + "learning_rate": 5.165673420738976e-05, + "loss": 0.6645, + "mean_token_accuracy": 0.7928799092769623, + "num_tokens": 191352428.0, + "step": 80900 + }, + { + "epoch": 0.7418171816264784, + "learning_rate": 5.1638397359493904e-05, + "loss": 0.7115, + "mean_token_accuracy": 0.7827491044998169, + "num_tokens": 191378634.0, + "step": 80910 + }, + { + "epoch": 0.7419088658659576, + "learning_rate": 5.1620060511598055e-05, + "loss": 0.718, + "mean_token_accuracy": 0.7823315680027008, + "num_tokens": 191403429.0, + "step": 80920 + }, + { + "epoch": 0.7420005501054369, + "learning_rate": 5.1601723663702214e-05, + "loss": 0.6668, + "mean_token_accuracy": 0.7925114870071411, + "num_tokens": 191428721.0, + "step": 80930 + }, + { + "epoch": 0.7420922343449161, + "learning_rate": 5.1583386815806366e-05, + "loss": 0.6859, + "mean_token_accuracy": 0.78622407913208, + "num_tokens": 191453870.0, + "step": 80940 + }, + { + "epoch": 0.7421839185843954, + "learning_rate": 5.156504996791052e-05, + "loss": 0.6847, + "mean_token_accuracy": 0.7923462331295014, + "num_tokens": 191479112.0, + "step": 80950 + }, + { + "epoch": 0.7422756028238746, + "learning_rate": 5.154671312001467e-05, + "loss": 0.7193, + "mean_token_accuracy": 0.7837464988231659, + "num_tokens": 191505489.0, + "step": 80960 + }, + { + "epoch": 0.7423672870633539, + "learning_rate": 5.152837627211883e-05, + "loss": 0.7645, + "mean_token_accuracy": 0.7756374478340149, + "num_tokens": 191531165.0, + "step": 80970 + }, + { + "epoch": 0.742458971302833, + "learning_rate": 5.151003942422298e-05, + "loss": 0.6538, + "mean_token_accuracy": 0.800909286737442, + "num_tokens": 191556349.0, + "step": 80980 + }, + { + "epoch": 0.7425506555423123, + "learning_rate": 5.1491702576327125e-05, + "loss": 0.7393, + "mean_token_accuracy": 0.7746599197387696, + "num_tokens": 191582371.0, + "step": 80990 + }, + { + "epoch": 0.7426423397817915, + "learning_rate": 5.147336572843129e-05, + "loss": 0.738, + "mean_token_accuracy": 0.7749620497226715, + "num_tokens": 191608035.0, + "step": 81000 + }, + { + "epoch": 0.7427340240212708, + "learning_rate": 5.1455028880535436e-05, + "loss": 0.699, + "mean_token_accuracy": 0.7854167759418488, + "num_tokens": 191632882.0, + "step": 81010 + }, + { + "epoch": 0.74282570826075, + "learning_rate": 5.143669203263959e-05, + "loss": 0.6982, + "mean_token_accuracy": 0.7897755622863769, + "num_tokens": 191657882.0, + "step": 81020 + }, + { + "epoch": 0.7429173925002293, + "learning_rate": 5.1418355184743746e-05, + "loss": 0.7065, + "mean_token_accuracy": 0.7861283838748931, + "num_tokens": 191683462.0, + "step": 81030 + }, + { + "epoch": 0.7430090767397084, + "learning_rate": 5.14000183368479e-05, + "loss": 0.732, + "mean_token_accuracy": 0.7773496985435486, + "num_tokens": 191709163.0, + "step": 81040 + }, + { + "epoch": 0.7431007609791876, + "learning_rate": 5.138168148895205e-05, + "loss": 0.711, + "mean_token_accuracy": 0.7879119396209717, + "num_tokens": 191734696.0, + "step": 81050 + }, + { + "epoch": 0.7431924452186669, + "learning_rate": 5.136334464105621e-05, + "loss": 0.715, + "mean_token_accuracy": 0.7803106546401978, + "num_tokens": 191760517.0, + "step": 81060 + }, + { + "epoch": 0.7432841294581461, + "learning_rate": 5.134500779316036e-05, + "loss": 0.7087, + "mean_token_accuracy": 0.781575471162796, + "num_tokens": 191786137.0, + "step": 81070 + }, + { + "epoch": 0.7433758136976254, + "learning_rate": 5.132667094526451e-05, + "loss": 0.6951, + "mean_token_accuracy": 0.7844762027263641, + "num_tokens": 191812243.0, + "step": 81080 + }, + { + "epoch": 0.7434674979371046, + "learning_rate": 5.130833409736866e-05, + "loss": 0.7159, + "mean_token_accuracy": 0.7803437769412994, + "num_tokens": 191837797.0, + "step": 81090 + }, + { + "epoch": 0.7435591821765839, + "learning_rate": 5.128999724947282e-05, + "loss": 0.7113, + "mean_token_accuracy": 0.7871942818164825, + "num_tokens": 191862973.0, + "step": 81100 + }, + { + "epoch": 0.743650866416063, + "learning_rate": 5.127166040157697e-05, + "loss": 0.6935, + "mean_token_accuracy": 0.784513133764267, + "num_tokens": 191888434.0, + "step": 81110 + }, + { + "epoch": 0.7437425506555423, + "learning_rate": 5.125332355368112e-05, + "loss": 0.6924, + "mean_token_accuracy": 0.7868725597858429, + "num_tokens": 191912876.0, + "step": 81120 + }, + { + "epoch": 0.7438342348950215, + "learning_rate": 5.123498670578528e-05, + "loss": 0.6631, + "mean_token_accuracy": 0.7957233726978302, + "num_tokens": 191938253.0, + "step": 81130 + }, + { + "epoch": 0.7439259191345008, + "learning_rate": 5.121664985788943e-05, + "loss": 0.709, + "mean_token_accuracy": 0.787634426355362, + "num_tokens": 191963475.0, + "step": 81140 + }, + { + "epoch": 0.74401760337398, + "learning_rate": 5.119831300999358e-05, + "loss": 0.7082, + "mean_token_accuracy": 0.7793751299381256, + "num_tokens": 191989423.0, + "step": 81150 + }, + { + "epoch": 0.7441092876134593, + "learning_rate": 5.117997616209774e-05, + "loss": 0.6721, + "mean_token_accuracy": 0.7872091174125672, + "num_tokens": 192015225.0, + "step": 81160 + }, + { + "epoch": 0.7442009718529384, + "learning_rate": 5.116163931420189e-05, + "loss": 0.6879, + "mean_token_accuracy": 0.7934359252452851, + "num_tokens": 192040218.0, + "step": 81170 + }, + { + "epoch": 0.7442926560924177, + "learning_rate": 5.1143302466306045e-05, + "loss": 0.7609, + "mean_token_accuracy": 0.7663623631000519, + "num_tokens": 192066391.0, + "step": 81180 + }, + { + "epoch": 0.7443843403318969, + "learning_rate": 5.11249656184102e-05, + "loss": 0.7058, + "mean_token_accuracy": 0.7837217688560486, + "num_tokens": 192091329.0, + "step": 81190 + }, + { + "epoch": 0.7444760245713762, + "learning_rate": 5.1106628770514355e-05, + "loss": 0.6478, + "mean_token_accuracy": 0.7939362585544586, + "num_tokens": 192116864.0, + "step": 81200 + }, + { + "epoch": 0.7445677088108554, + "learning_rate": 5.10882919226185e-05, + "loss": 0.7065, + "mean_token_accuracy": 0.7797066390514373, + "num_tokens": 192142193.0, + "step": 81210 + }, + { + "epoch": 0.7446593930503347, + "learning_rate": 5.106995507472265e-05, + "loss": 0.69, + "mean_token_accuracy": 0.7788159012794494, + "num_tokens": 192166842.0, + "step": 81220 + }, + { + "epoch": 0.7447510772898139, + "learning_rate": 5.105161822682681e-05, + "loss": 0.7078, + "mean_token_accuracy": 0.7824737727642059, + "num_tokens": 192192793.0, + "step": 81230 + }, + { + "epoch": 0.7448427615292931, + "learning_rate": 5.103328137893096e-05, + "loss": 0.7076, + "mean_token_accuracy": 0.7827406227588654, + "num_tokens": 192217991.0, + "step": 81240 + }, + { + "epoch": 0.7449344457687723, + "learning_rate": 5.1014944531035115e-05, + "loss": 0.6649, + "mean_token_accuracy": 0.7950560629367829, + "num_tokens": 192243524.0, + "step": 81250 + }, + { + "epoch": 0.7450261300082516, + "learning_rate": 5.099660768313927e-05, + "loss": 0.6779, + "mean_token_accuracy": 0.7937249064445495, + "num_tokens": 192269617.0, + "step": 81260 + }, + { + "epoch": 0.7451178142477308, + "learning_rate": 5.0978270835243425e-05, + "loss": 0.6857, + "mean_token_accuracy": 0.7913187861442565, + "num_tokens": 192294719.0, + "step": 81270 + }, + { + "epoch": 0.7452094984872101, + "learning_rate": 5.095993398734758e-05, + "loss": 0.74, + "mean_token_accuracy": 0.7766092956066132, + "num_tokens": 192320843.0, + "step": 81280 + }, + { + "epoch": 0.7453011827266893, + "learning_rate": 5.0941597139451736e-05, + "loss": 0.687, + "mean_token_accuracy": 0.7891350746154785, + "num_tokens": 192346091.0, + "step": 81290 + }, + { + "epoch": 0.7453928669661685, + "learning_rate": 5.092326029155589e-05, + "loss": 0.7044, + "mean_token_accuracy": 0.7799795985221862, + "num_tokens": 192371537.0, + "step": 81300 + }, + { + "epoch": 0.7454845512056477, + "learning_rate": 5.090492344366003e-05, + "loss": 0.6818, + "mean_token_accuracy": 0.7914417624473572, + "num_tokens": 192397037.0, + "step": 81310 + }, + { + "epoch": 0.745576235445127, + "learning_rate": 5.0886586595764184e-05, + "loss": 0.7279, + "mean_token_accuracy": 0.7714911818504333, + "num_tokens": 192423175.0, + "step": 81320 + }, + { + "epoch": 0.7456679196846062, + "learning_rate": 5.086824974786834e-05, + "loss": 0.7194, + "mean_token_accuracy": 0.7792998969554901, + "num_tokens": 192448252.0, + "step": 81330 + }, + { + "epoch": 0.7457596039240855, + "learning_rate": 5.0849912899972495e-05, + "loss": 0.7337, + "mean_token_accuracy": 0.7705634891986847, + "num_tokens": 192474216.0, + "step": 81340 + }, + { + "epoch": 0.7458512881635647, + "learning_rate": 5.083157605207665e-05, + "loss": 0.7424, + "mean_token_accuracy": 0.7710492253303528, + "num_tokens": 192500074.0, + "step": 81350 + }, + { + "epoch": 0.745942972403044, + "learning_rate": 5.0813239204180805e-05, + "loss": 0.6846, + "mean_token_accuracy": 0.7872656166553498, + "num_tokens": 192524546.0, + "step": 81360 + }, + { + "epoch": 0.7460346566425231, + "learning_rate": 5.079490235628496e-05, + "loss": 0.6398, + "mean_token_accuracy": 0.7989014267921448, + "num_tokens": 192548585.0, + "step": 81370 + }, + { + "epoch": 0.7461263408820024, + "learning_rate": 5.077656550838911e-05, + "loss": 0.6677, + "mean_token_accuracy": 0.7930905401706696, + "num_tokens": 192573340.0, + "step": 81380 + }, + { + "epoch": 0.7462180251214816, + "learning_rate": 5.075822866049327e-05, + "loss": 0.7075, + "mean_token_accuracy": 0.7884686052799225, + "num_tokens": 192598768.0, + "step": 81390 + }, + { + "epoch": 0.7463097093609609, + "learning_rate": 5.073989181259742e-05, + "loss": 0.6599, + "mean_token_accuracy": 0.796476936340332, + "num_tokens": 192624715.0, + "step": 81400 + }, + { + "epoch": 0.7464013936004401, + "learning_rate": 5.0721554964701565e-05, + "loss": 0.7241, + "mean_token_accuracy": 0.7784188091754913, + "num_tokens": 192649733.0, + "step": 81410 + }, + { + "epoch": 0.7464930778399194, + "learning_rate": 5.070321811680573e-05, + "loss": 0.6986, + "mean_token_accuracy": 0.7878309786319733, + "num_tokens": 192675901.0, + "step": 81420 + }, + { + "epoch": 0.7465847620793985, + "learning_rate": 5.0684881268909875e-05, + "loss": 0.6701, + "mean_token_accuracy": 0.7902319371700287, + "num_tokens": 192700966.0, + "step": 81430 + }, + { + "epoch": 0.7466764463188778, + "learning_rate": 5.066654442101403e-05, + "loss": 0.7343, + "mean_token_accuracy": 0.7827136933803558, + "num_tokens": 192725850.0, + "step": 81440 + }, + { + "epoch": 0.746768130558357, + "learning_rate": 5.064820757311818e-05, + "loss": 0.6962, + "mean_token_accuracy": 0.7829465329647064, + "num_tokens": 192751309.0, + "step": 81450 + }, + { + "epoch": 0.7468598147978363, + "learning_rate": 5.062987072522234e-05, + "loss": 0.7434, + "mean_token_accuracy": 0.7767478287220001, + "num_tokens": 192776640.0, + "step": 81460 + }, + { + "epoch": 0.7469514990373155, + "learning_rate": 5.061153387732649e-05, + "loss": 0.7085, + "mean_token_accuracy": 0.7855776369571685, + "num_tokens": 192802231.0, + "step": 81470 + }, + { + "epoch": 0.7470431832767948, + "learning_rate": 5.059319702943064e-05, + "loss": 0.7769, + "mean_token_accuracy": 0.764584481716156, + "num_tokens": 192828243.0, + "step": 81480 + }, + { + "epoch": 0.747134867516274, + "learning_rate": 5.05748601815348e-05, + "loss": 0.6605, + "mean_token_accuracy": 0.7890223801136017, + "num_tokens": 192853669.0, + "step": 81490 + }, + { + "epoch": 0.7472265517557531, + "learning_rate": 5.055652333363895e-05, + "loss": 0.7202, + "mean_token_accuracy": 0.7801950812339783, + "num_tokens": 192879309.0, + "step": 81500 + }, + { + "epoch": 0.7473182359952324, + "learning_rate": 5.05381864857431e-05, + "loss": 0.7504, + "mean_token_accuracy": 0.7756495952606202, + "num_tokens": 192905080.0, + "step": 81510 + }, + { + "epoch": 0.7474099202347116, + "learning_rate": 5.051984963784726e-05, + "loss": 0.8258, + "mean_token_accuracy": 0.7540276765823364, + "num_tokens": 192931322.0, + "step": 81520 + }, + { + "epoch": 0.7475016044741909, + "learning_rate": 5.050151278995141e-05, + "loss": 0.7431, + "mean_token_accuracy": 0.7807523667812347, + "num_tokens": 192956899.0, + "step": 81530 + }, + { + "epoch": 0.7475932887136701, + "learning_rate": 5.048317594205556e-05, + "loss": 0.7985, + "mean_token_accuracy": 0.7603351235389709, + "num_tokens": 192983812.0, + "step": 81540 + }, + { + "epoch": 0.7476849729531494, + "learning_rate": 5.0464839094159725e-05, + "loss": 0.6954, + "mean_token_accuracy": 0.7857788622379303, + "num_tokens": 193008604.0, + "step": 81550 + }, + { + "epoch": 0.7477766571926285, + "learning_rate": 5.044650224626387e-05, + "loss": 0.7176, + "mean_token_accuracy": 0.7779941558837891, + "num_tokens": 193034820.0, + "step": 81560 + }, + { + "epoch": 0.7478683414321078, + "learning_rate": 5.042816539836802e-05, + "loss": 0.7774, + "mean_token_accuracy": 0.772507619857788, + "num_tokens": 193061170.0, + "step": 81570 + }, + { + "epoch": 0.747960025671587, + "learning_rate": 5.0409828550472174e-05, + "loss": 0.6938, + "mean_token_accuracy": 0.785056871175766, + "num_tokens": 193086556.0, + "step": 81580 + }, + { + "epoch": 0.7480517099110663, + "learning_rate": 5.039149170257633e-05, + "loss": 0.8707, + "mean_token_accuracy": 0.7458867251873016, + "num_tokens": 193113779.0, + "step": 81590 + }, + { + "epoch": 0.7481433941505455, + "learning_rate": 5.0373154854680484e-05, + "loss": 0.7181, + "mean_token_accuracy": 0.7856736123561859, + "num_tokens": 193140171.0, + "step": 81600 + }, + { + "epoch": 0.7482350783900248, + "learning_rate": 5.035481800678463e-05, + "loss": 0.6818, + "mean_token_accuracy": 0.7914603292942047, + "num_tokens": 193165390.0, + "step": 81610 + }, + { + "epoch": 0.748326762629504, + "learning_rate": 5.0336481158888795e-05, + "loss": 0.6895, + "mean_token_accuracy": 0.7843019604682923, + "num_tokens": 193192098.0, + "step": 81620 + }, + { + "epoch": 0.7484184468689832, + "learning_rate": 5.031814431099294e-05, + "loss": 0.7608, + "mean_token_accuracy": 0.7733224153518676, + "num_tokens": 193217305.0, + "step": 81630 + }, + { + "epoch": 0.7485101311084624, + "learning_rate": 5.029980746309709e-05, + "loss": 0.8569, + "mean_token_accuracy": 0.74853515625, + "num_tokens": 193245930.0, + "step": 81640 + }, + { + "epoch": 0.7486018153479417, + "learning_rate": 5.028147061520126e-05, + "loss": 0.7385, + "mean_token_accuracy": 0.7779390633106231, + "num_tokens": 193272335.0, + "step": 81650 + }, + { + "epoch": 0.7486934995874209, + "learning_rate": 5.02631337673054e-05, + "loss": 0.7516, + "mean_token_accuracy": 0.7716957569122315, + "num_tokens": 193298482.0, + "step": 81660 + }, + { + "epoch": 0.7487851838269002, + "learning_rate": 5.0244796919409554e-05, + "loss": 0.6871, + "mean_token_accuracy": 0.7878741502761841, + "num_tokens": 193323393.0, + "step": 81670 + }, + { + "epoch": 0.7488768680663794, + "learning_rate": 5.022646007151371e-05, + "loss": 0.7245, + "mean_token_accuracy": 0.7755094230175018, + "num_tokens": 193348487.0, + "step": 81680 + }, + { + "epoch": 0.7489685523058586, + "learning_rate": 5.0208123223617864e-05, + "loss": 0.7531, + "mean_token_accuracy": 0.7713774621486664, + "num_tokens": 193373605.0, + "step": 81690 + }, + { + "epoch": 0.7490602365453378, + "learning_rate": 5.0189786375722016e-05, + "loss": 0.8449, + "mean_token_accuracy": 0.750771677494049, + "num_tokens": 193402804.0, + "step": 81700 + }, + { + "epoch": 0.7491519207848171, + "learning_rate": 5.017144952782616e-05, + "loss": 0.7251, + "mean_token_accuracy": 0.7795206308364868, + "num_tokens": 193428268.0, + "step": 81710 + }, + { + "epoch": 0.7492436050242963, + "learning_rate": 5.015311267993033e-05, + "loss": 0.8024, + "mean_token_accuracy": 0.7697794437408447, + "num_tokens": 193454181.0, + "step": 81720 + }, + { + "epoch": 0.7493352892637756, + "learning_rate": 5.013477583203447e-05, + "loss": 0.7583, + "mean_token_accuracy": 0.7685450136661529, + "num_tokens": 193480553.0, + "step": 81730 + }, + { + "epoch": 0.7494269735032548, + "learning_rate": 5.0116438984138624e-05, + "loss": 0.7514, + "mean_token_accuracy": 0.7715674877166748, + "num_tokens": 193507507.0, + "step": 81740 + }, + { + "epoch": 0.7495186577427341, + "learning_rate": 5.009810213624279e-05, + "loss": 0.7634, + "mean_token_accuracy": 0.7732964396476746, + "num_tokens": 193534341.0, + "step": 81750 + }, + { + "epoch": 0.7496103419822132, + "learning_rate": 5.0079765288346934e-05, + "loss": 0.7842, + "mean_token_accuracy": 0.7643706262111664, + "num_tokens": 193561440.0, + "step": 81760 + }, + { + "epoch": 0.7497020262216925, + "learning_rate": 5.0061428440451086e-05, + "loss": 0.8439, + "mean_token_accuracy": 0.7495325326919555, + "num_tokens": 193590705.0, + "step": 81770 + }, + { + "epoch": 0.7497937104611717, + "learning_rate": 5.0043091592555245e-05, + "loss": 0.6869, + "mean_token_accuracy": 0.7873552143573761, + "num_tokens": 193616380.0, + "step": 81780 + }, + { + "epoch": 0.749885394700651, + "learning_rate": 5.00247547446594e-05, + "loss": 0.7524, + "mean_token_accuracy": 0.7729937136173248, + "num_tokens": 193640836.0, + "step": 81790 + }, + { + "epoch": 0.7499770789401302, + "learning_rate": 5.000641789676355e-05, + "loss": 0.793, + "mean_token_accuracy": 0.7657868981361389, + "num_tokens": 193667721.0, + "step": 81800 + }, + { + "epoch": 0.7500687631796095, + "learning_rate": 4.99880810488677e-05, + "loss": 0.806, + "mean_token_accuracy": 0.7578528225421906, + "num_tokens": 193694718.0, + "step": 81810 + }, + { + "epoch": 0.7501604474190886, + "learning_rate": 4.996974420097186e-05, + "loss": 0.7636, + "mean_token_accuracy": 0.7735159158706665, + "num_tokens": 193720375.0, + "step": 81820 + }, + { + "epoch": 0.7502521316585679, + "learning_rate": 4.9951407353076004e-05, + "loss": 0.6742, + "mean_token_accuracy": 0.7935140013694764, + "num_tokens": 193746126.0, + "step": 81830 + }, + { + "epoch": 0.7503438158980471, + "learning_rate": 4.993307050518016e-05, + "loss": 0.8474, + "mean_token_accuracy": 0.7509146213531495, + "num_tokens": 193774702.0, + "step": 81840 + }, + { + "epoch": 0.7504355001375264, + "learning_rate": 4.9914733657284315e-05, + "loss": 0.7746, + "mean_token_accuracy": 0.7741905748844147, + "num_tokens": 193800746.0, + "step": 81850 + }, + { + "epoch": 0.7505271843770056, + "learning_rate": 4.9896396809388467e-05, + "loss": 0.7429, + "mean_token_accuracy": 0.7753175258636474, + "num_tokens": 193827327.0, + "step": 81860 + }, + { + "epoch": 0.7506188686164849, + "learning_rate": 4.9878059961492625e-05, + "loss": 0.7318, + "mean_token_accuracy": 0.7754132926464081, + "num_tokens": 193853189.0, + "step": 81870 + }, + { + "epoch": 0.7507105528559641, + "learning_rate": 4.985972311359677e-05, + "loss": 0.6884, + "mean_token_accuracy": 0.7916352927684784, + "num_tokens": 193879486.0, + "step": 81880 + }, + { + "epoch": 0.7508022370954432, + "learning_rate": 4.984138626570093e-05, + "loss": 0.8695, + "mean_token_accuracy": 0.7477820873260498, + "num_tokens": 193908094.0, + "step": 81890 + }, + { + "epoch": 0.7508939213349225, + "learning_rate": 4.982304941780509e-05, + "loss": 0.8587, + "mean_token_accuracy": 0.749259614944458, + "num_tokens": 193936986.0, + "step": 81900 + }, + { + "epoch": 0.7509856055744017, + "learning_rate": 4.980471256990923e-05, + "loss": 0.7081, + "mean_token_accuracy": 0.7845314800739288, + "num_tokens": 193963648.0, + "step": 81910 + }, + { + "epoch": 0.751077289813881, + "learning_rate": 4.978637572201339e-05, + "loss": 0.7839, + "mean_token_accuracy": 0.7613317847251893, + "num_tokens": 193989812.0, + "step": 81920 + }, + { + "epoch": 0.7511689740533602, + "learning_rate": 4.9768038874117536e-05, + "loss": 0.7988, + "mean_token_accuracy": 0.7601967811584472, + "num_tokens": 194017550.0, + "step": 81930 + }, + { + "epoch": 0.7512606582928395, + "learning_rate": 4.9749702026221695e-05, + "loss": 0.7725, + "mean_token_accuracy": 0.7678104877471924, + "num_tokens": 194044106.0, + "step": 81940 + }, + { + "epoch": 0.7513523425323186, + "learning_rate": 4.9731365178325854e-05, + "loss": 0.7516, + "mean_token_accuracy": 0.7737136840820312, + "num_tokens": 194070051.0, + "step": 81950 + }, + { + "epoch": 0.7514440267717979, + "learning_rate": 4.971302833043e-05, + "loss": 0.8265, + "mean_token_accuracy": 0.7505439996719361, + "num_tokens": 194098289.0, + "step": 81960 + }, + { + "epoch": 0.7515357110112771, + "learning_rate": 4.969469148253416e-05, + "loss": 0.7109, + "mean_token_accuracy": 0.7753967463970184, + "num_tokens": 194124068.0, + "step": 81970 + }, + { + "epoch": 0.7516273952507564, + "learning_rate": 4.96763546346383e-05, + "loss": 0.7599, + "mean_token_accuracy": 0.769416093826294, + "num_tokens": 194150676.0, + "step": 81980 + }, + { + "epoch": 0.7517190794902356, + "learning_rate": 4.965801778674246e-05, + "loss": 0.8358, + "mean_token_accuracy": 0.747289651632309, + "num_tokens": 194179280.0, + "step": 81990 + }, + { + "epoch": 0.7518107637297149, + "learning_rate": 4.963968093884662e-05, + "loss": 0.8271, + "mean_token_accuracy": 0.7535883486270905, + "num_tokens": 194207018.0, + "step": 82000 + }, + { + "epoch": 0.7519024479691941, + "learning_rate": 4.9621344090950765e-05, + "loss": 0.9148, + "mean_token_accuracy": 0.7365788459777832, + "num_tokens": 194236736.0, + "step": 82010 + }, + { + "epoch": 0.7519941322086733, + "learning_rate": 4.9603007243054924e-05, + "loss": 0.8665, + "mean_token_accuracy": 0.7488987386226654, + "num_tokens": 194264334.0, + "step": 82020 + }, + { + "epoch": 0.7520858164481525, + "learning_rate": 4.958467039515907e-05, + "loss": 0.7868, + "mean_token_accuracy": 0.7618037223815918, + "num_tokens": 194291772.0, + "step": 82030 + }, + { + "epoch": 0.7521775006876318, + "learning_rate": 4.956633354726323e-05, + "loss": 0.7589, + "mean_token_accuracy": 0.7747104287147522, + "num_tokens": 194318381.0, + "step": 82040 + }, + { + "epoch": 0.752269184927111, + "learning_rate": 4.9547996699367386e-05, + "loss": 0.7958, + "mean_token_accuracy": 0.760222977399826, + "num_tokens": 194346059.0, + "step": 82050 + }, + { + "epoch": 0.7523608691665903, + "learning_rate": 4.952965985147153e-05, + "loss": 0.8587, + "mean_token_accuracy": 0.7498927354812622, + "num_tokens": 194373753.0, + "step": 82060 + }, + { + "epoch": 0.7524525534060695, + "learning_rate": 4.951132300357569e-05, + "loss": 0.6909, + "mean_token_accuracy": 0.7929769337177277, + "num_tokens": 194399024.0, + "step": 82070 + }, + { + "epoch": 0.7525442376455487, + "learning_rate": 4.949298615567984e-05, + "loss": 0.7802, + "mean_token_accuracy": 0.7730043709278107, + "num_tokens": 194425365.0, + "step": 82080 + }, + { + "epoch": 0.7526359218850279, + "learning_rate": 4.947464930778399e-05, + "loss": 0.7663, + "mean_token_accuracy": 0.7677356362342834, + "num_tokens": 194451118.0, + "step": 82090 + }, + { + "epoch": 0.7527276061245072, + "learning_rate": 4.945631245988815e-05, + "loss": 0.7588, + "mean_token_accuracy": 0.7705836236476898, + "num_tokens": 194477681.0, + "step": 82100 + }, + { + "epoch": 0.7528192903639864, + "learning_rate": 4.94379756119923e-05, + "loss": 0.7471, + "mean_token_accuracy": 0.7777624130249023, + "num_tokens": 194504189.0, + "step": 82110 + }, + { + "epoch": 0.7529109746034657, + "learning_rate": 4.9419638764096456e-05, + "loss": 0.884, + "mean_token_accuracy": 0.7406049251556397, + "num_tokens": 194532981.0, + "step": 82120 + }, + { + "epoch": 0.7530026588429449, + "learning_rate": 4.940130191620061e-05, + "loss": 0.8126, + "mean_token_accuracy": 0.7547918617725372, + "num_tokens": 194560608.0, + "step": 82130 + }, + { + "epoch": 0.7530943430824242, + "learning_rate": 4.938296506830476e-05, + "loss": 0.8782, + "mean_token_accuracy": 0.7428805947303772, + "num_tokens": 194588926.0, + "step": 82140 + }, + { + "epoch": 0.7531860273219033, + "learning_rate": 4.936462822040892e-05, + "loss": 0.7559, + "mean_token_accuracy": 0.7802633821964264, + "num_tokens": 194613475.0, + "step": 82150 + }, + { + "epoch": 0.7532777115613826, + "learning_rate": 4.934629137251306e-05, + "loss": 0.7837, + "mean_token_accuracy": 0.7672086238861084, + "num_tokens": 194640374.0, + "step": 82160 + }, + { + "epoch": 0.7533693958008618, + "learning_rate": 4.932795452461722e-05, + "loss": 0.8208, + "mean_token_accuracy": 0.7582300066947937, + "num_tokens": 194668213.0, + "step": 82170 + }, + { + "epoch": 0.7534610800403411, + "learning_rate": 4.9309617676721374e-05, + "loss": 0.937, + "mean_token_accuracy": 0.7293002188205719, + "num_tokens": 194698994.0, + "step": 82180 + }, + { + "epoch": 0.7535527642798203, + "learning_rate": 4.9291280828825526e-05, + "loss": 0.8646, + "mean_token_accuracy": 0.7472356975078582, + "num_tokens": 194727596.0, + "step": 82190 + }, + { + "epoch": 0.7536444485192996, + "learning_rate": 4.9272943980929684e-05, + "loss": 0.8644, + "mean_token_accuracy": 0.7457275450229645, + "num_tokens": 194755504.0, + "step": 82200 + }, + { + "epoch": 0.7537361327587788, + "learning_rate": 4.9254607133033836e-05, + "loss": 0.7907, + "mean_token_accuracy": 0.7620010018348694, + "num_tokens": 194781799.0, + "step": 82210 + }, + { + "epoch": 0.753827816998258, + "learning_rate": 4.923627028513799e-05, + "loss": 0.8128, + "mean_token_accuracy": 0.7590906023979187, + "num_tokens": 194808353.0, + "step": 82220 + }, + { + "epoch": 0.7539195012377372, + "learning_rate": 4.921793343724214e-05, + "loss": 0.811, + "mean_token_accuracy": 0.7560511231422424, + "num_tokens": 194836071.0, + "step": 82230 + }, + { + "epoch": 0.7540111854772165, + "learning_rate": 4.919959658934629e-05, + "loss": 0.831, + "mean_token_accuracy": 0.7527174770832061, + "num_tokens": 194864236.0, + "step": 82240 + }, + { + "epoch": 0.7541028697166957, + "learning_rate": 4.918125974145045e-05, + "loss": 0.8575, + "mean_token_accuracy": 0.7455669045448303, + "num_tokens": 194893911.0, + "step": 82250 + }, + { + "epoch": 0.754194553956175, + "learning_rate": 4.91629228935546e-05, + "loss": 0.8665, + "mean_token_accuracy": 0.7482231497764588, + "num_tokens": 194922090.0, + "step": 82260 + }, + { + "epoch": 0.7542862381956542, + "learning_rate": 4.9144586045658754e-05, + "loss": 0.7877, + "mean_token_accuracy": 0.7638835310935974, + "num_tokens": 194950326.0, + "step": 82270 + }, + { + "epoch": 0.7543779224351334, + "learning_rate": 4.9126249197762906e-05, + "loss": 0.7719, + "mean_token_accuracy": 0.7675490319728852, + "num_tokens": 194978589.0, + "step": 82280 + }, + { + "epoch": 0.7544696066746126, + "learning_rate": 4.910791234986706e-05, + "loss": 0.772, + "mean_token_accuracy": 0.773044204711914, + "num_tokens": 195005342.0, + "step": 82290 + }, + { + "epoch": 0.7545612909140919, + "learning_rate": 4.9089575501971216e-05, + "loss": 0.8271, + "mean_token_accuracy": 0.7553254723548889, + "num_tokens": 195033339.0, + "step": 82300 + }, + { + "epoch": 0.7546529751535711, + "learning_rate": 4.907123865407537e-05, + "loss": 0.8204, + "mean_token_accuracy": 0.7502288699150086, + "num_tokens": 195062836.0, + "step": 82310 + }, + { + "epoch": 0.7547446593930504, + "learning_rate": 4.905290180617952e-05, + "loss": 0.7888, + "mean_token_accuracy": 0.7607177436351776, + "num_tokens": 195089469.0, + "step": 82320 + }, + { + "epoch": 0.7548363436325296, + "learning_rate": 4.903456495828367e-05, + "loss": 0.7779, + "mean_token_accuracy": 0.7668349742889404, + "num_tokens": 195115880.0, + "step": 82330 + }, + { + "epoch": 0.7549280278720089, + "learning_rate": 4.9016228110387824e-05, + "loss": 0.7597, + "mean_token_accuracy": 0.768760347366333, + "num_tokens": 195142804.0, + "step": 82340 + }, + { + "epoch": 0.755019712111488, + "learning_rate": 4.899789126249198e-05, + "loss": 0.8594, + "mean_token_accuracy": 0.7467792809009552, + "num_tokens": 195170419.0, + "step": 82350 + }, + { + "epoch": 0.7551113963509672, + "learning_rate": 4.8979554414596134e-05, + "loss": 0.7737, + "mean_token_accuracy": 0.7684077203273774, + "num_tokens": 195197127.0, + "step": 82360 + }, + { + "epoch": 0.7552030805904465, + "learning_rate": 4.8961217566700286e-05, + "loss": 0.8452, + "mean_token_accuracy": 0.7499734938144684, + "num_tokens": 195225039.0, + "step": 82370 + }, + { + "epoch": 0.7552947648299257, + "learning_rate": 4.894288071880444e-05, + "loss": 0.8044, + "mean_token_accuracy": 0.7629131078720093, + "num_tokens": 195252697.0, + "step": 82380 + }, + { + "epoch": 0.755386449069405, + "learning_rate": 4.89245438709086e-05, + "loss": 0.8057, + "mean_token_accuracy": 0.7554194688796997, + "num_tokens": 195280706.0, + "step": 82390 + }, + { + "epoch": 0.7554781333088842, + "learning_rate": 4.890620702301275e-05, + "loss": 0.8122, + "mean_token_accuracy": 0.7619563937187195, + "num_tokens": 195309976.0, + "step": 82400 + }, + { + "epoch": 0.7555698175483634, + "learning_rate": 4.88878701751169e-05, + "loss": 0.8602, + "mean_token_accuracy": 0.7478345215320588, + "num_tokens": 195340195.0, + "step": 82410 + }, + { + "epoch": 0.7556615017878426, + "learning_rate": 4.886953332722105e-05, + "loss": 0.8824, + "mean_token_accuracy": 0.7405252516269684, + "num_tokens": 195369556.0, + "step": 82420 + }, + { + "epoch": 0.7557531860273219, + "learning_rate": 4.8851196479325204e-05, + "loss": 0.959, + "mean_token_accuracy": 0.7258198380470275, + "num_tokens": 195400518.0, + "step": 82430 + }, + { + "epoch": 0.7558448702668011, + "learning_rate": 4.883285963142936e-05, + "loss": 0.8132, + "mean_token_accuracy": 0.7587051033973694, + "num_tokens": 195427781.0, + "step": 82440 + }, + { + "epoch": 0.7559365545062804, + "learning_rate": 4.8814522783533515e-05, + "loss": 0.8026, + "mean_token_accuracy": 0.7610012650489807, + "num_tokens": 195455949.0, + "step": 82450 + }, + { + "epoch": 0.7560282387457596, + "learning_rate": 4.879618593563767e-05, + "loss": 0.7841, + "mean_token_accuracy": 0.763341772556305, + "num_tokens": 195482634.0, + "step": 82460 + }, + { + "epoch": 0.7561199229852389, + "learning_rate": 4.877784908774182e-05, + "loss": 0.7723, + "mean_token_accuracy": 0.7670092403888702, + "num_tokens": 195508898.0, + "step": 82470 + }, + { + "epoch": 0.756211607224718, + "learning_rate": 4.875951223984597e-05, + "loss": 0.8222, + "mean_token_accuracy": 0.7569530308246613, + "num_tokens": 195536749.0, + "step": 82480 + }, + { + "epoch": 0.7563032914641973, + "learning_rate": 4.874117539195013e-05, + "loss": 0.879, + "mean_token_accuracy": 0.7417121946811676, + "num_tokens": 195568229.0, + "step": 82490 + }, + { + "epoch": 0.7563949757036765, + "learning_rate": 4.872283854405428e-05, + "loss": 0.862, + "mean_token_accuracy": 0.7439973294734955, + "num_tokens": 195596713.0, + "step": 82500 + }, + { + "epoch": 0.7564866599431558, + "learning_rate": 4.870450169615843e-05, + "loss": 0.7791, + "mean_token_accuracy": 0.7655384838581085, + "num_tokens": 195624296.0, + "step": 82510 + }, + { + "epoch": 0.756578344182635, + "learning_rate": 4.868616484826259e-05, + "loss": 0.8227, + "mean_token_accuracy": 0.7539513170719147, + "num_tokens": 195652740.0, + "step": 82520 + }, + { + "epoch": 0.7566700284221143, + "learning_rate": 4.8667828000366737e-05, + "loss": 0.8639, + "mean_token_accuracy": 0.7521308600902558, + "num_tokens": 195681474.0, + "step": 82530 + }, + { + "epoch": 0.7567617126615934, + "learning_rate": 4.8649491152470895e-05, + "loss": 0.8572, + "mean_token_accuracy": 0.7475384712219239, + "num_tokens": 195711310.0, + "step": 82540 + }, + { + "epoch": 0.7568533969010727, + "learning_rate": 4.863115430457505e-05, + "loss": 0.879, + "mean_token_accuracy": 0.7408627092838287, + "num_tokens": 195740761.0, + "step": 82550 + }, + { + "epoch": 0.7569450811405519, + "learning_rate": 4.86128174566792e-05, + "loss": 0.8709, + "mean_token_accuracy": 0.7468157231807708, + "num_tokens": 195769948.0, + "step": 82560 + }, + { + "epoch": 0.7570367653800312, + "learning_rate": 4.859448060878336e-05, + "loss": 0.8252, + "mean_token_accuracy": 0.7560142934322357, + "num_tokens": 195797197.0, + "step": 82570 + }, + { + "epoch": 0.7571284496195104, + "learning_rate": 4.85761437608875e-05, + "loss": 0.7946, + "mean_token_accuracy": 0.7610917687416077, + "num_tokens": 195824521.0, + "step": 82580 + }, + { + "epoch": 0.7572201338589897, + "learning_rate": 4.855780691299166e-05, + "loss": 0.8261, + "mean_token_accuracy": 0.7522114157676697, + "num_tokens": 195852487.0, + "step": 82590 + }, + { + "epoch": 0.7573118180984689, + "learning_rate": 4.853947006509581e-05, + "loss": 0.8967, + "mean_token_accuracy": 0.732669985294342, + "num_tokens": 195880618.0, + "step": 82600 + }, + { + "epoch": 0.7574035023379481, + "learning_rate": 4.8521133217199965e-05, + "loss": 0.7925, + "mean_token_accuracy": 0.7619107902050019, + "num_tokens": 195908327.0, + "step": 82610 + }, + { + "epoch": 0.7574951865774273, + "learning_rate": 4.8502796369304124e-05, + "loss": 0.8886, + "mean_token_accuracy": 0.7358214437961579, + "num_tokens": 195937783.0, + "step": 82620 + }, + { + "epoch": 0.7575868708169066, + "learning_rate": 4.848445952140827e-05, + "loss": 0.7455, + "mean_token_accuracy": 0.7729065895080567, + "num_tokens": 195963372.0, + "step": 82630 + }, + { + "epoch": 0.7576785550563858, + "learning_rate": 4.846612267351243e-05, + "loss": 0.7431, + "mean_token_accuracy": 0.7816286683082581, + "num_tokens": 195989696.0, + "step": 82640 + }, + { + "epoch": 0.7577702392958651, + "learning_rate": 4.844778582561658e-05, + "loss": 0.822, + "mean_token_accuracy": 0.7576343536376953, + "num_tokens": 196018147.0, + "step": 82650 + }, + { + "epoch": 0.7578619235353443, + "learning_rate": 4.842944897772073e-05, + "loss": 0.8433, + "mean_token_accuracy": 0.7488945424556732, + "num_tokens": 196048614.0, + "step": 82660 + }, + { + "epoch": 0.7579536077748235, + "learning_rate": 4.841111212982489e-05, + "loss": 0.8822, + "mean_token_accuracy": 0.7415592491626739, + "num_tokens": 196080408.0, + "step": 82670 + }, + { + "epoch": 0.7580452920143027, + "learning_rate": 4.8392775281929035e-05, + "loss": 0.8703, + "mean_token_accuracy": 0.7413014054298401, + "num_tokens": 196109770.0, + "step": 82680 + }, + { + "epoch": 0.758136976253782, + "learning_rate": 4.8374438434033194e-05, + "loss": 0.7501, + "mean_token_accuracy": 0.7770328938961029, + "num_tokens": 196136569.0, + "step": 82690 + }, + { + "epoch": 0.7582286604932612, + "learning_rate": 4.8356101586137345e-05, + "loss": 0.7632, + "mean_token_accuracy": 0.7713229894638062, + "num_tokens": 196164399.0, + "step": 82700 + }, + { + "epoch": 0.7583203447327405, + "learning_rate": 4.83377647382415e-05, + "loss": 0.8432, + "mean_token_accuracy": 0.7497777819633484, + "num_tokens": 196196164.0, + "step": 82710 + }, + { + "epoch": 0.7584120289722197, + "learning_rate": 4.8319427890345656e-05, + "loss": 0.9047, + "mean_token_accuracy": 0.7338837504386901, + "num_tokens": 196225746.0, + "step": 82720 + }, + { + "epoch": 0.758503713211699, + "learning_rate": 4.83010910424498e-05, + "loss": 0.8781, + "mean_token_accuracy": 0.7373611271381378, + "num_tokens": 196254408.0, + "step": 82730 + }, + { + "epoch": 0.7585953974511781, + "learning_rate": 4.828275419455396e-05, + "loss": 0.8818, + "mean_token_accuracy": 0.7404162049293518, + "num_tokens": 196284528.0, + "step": 82740 + }, + { + "epoch": 0.7586870816906574, + "learning_rate": 4.826441734665811e-05, + "loss": 0.7751, + "mean_token_accuracy": 0.7641188085079194, + "num_tokens": 196312235.0, + "step": 82750 + }, + { + "epoch": 0.7587787659301366, + "learning_rate": 4.824608049876226e-05, + "loss": 0.8109, + "mean_token_accuracy": 0.756779420375824, + "num_tokens": 196340891.0, + "step": 82760 + }, + { + "epoch": 0.7588704501696159, + "learning_rate": 4.822774365086642e-05, + "loss": 0.8108, + "mean_token_accuracy": 0.7533910214900971, + "num_tokens": 196369247.0, + "step": 82770 + }, + { + "epoch": 0.7589621344090951, + "learning_rate": 4.820940680297057e-05, + "loss": 0.8806, + "mean_token_accuracy": 0.7383510410785675, + "num_tokens": 196401289.0, + "step": 82780 + }, + { + "epoch": 0.7590538186485744, + "learning_rate": 4.8191069955074726e-05, + "loss": 0.8864, + "mean_token_accuracy": 0.7434684038162231, + "num_tokens": 196430309.0, + "step": 82790 + }, + { + "epoch": 0.7591455028880535, + "learning_rate": 4.817273310717888e-05, + "loss": 0.9156, + "mean_token_accuracy": 0.7362958908081054, + "num_tokens": 196461997.0, + "step": 82800 + }, + { + "epoch": 0.7592371871275327, + "learning_rate": 4.815439625928303e-05, + "loss": 0.7971, + "mean_token_accuracy": 0.7583592057228088, + "num_tokens": 196489372.0, + "step": 82810 + }, + { + "epoch": 0.759328871367012, + "learning_rate": 4.813605941138719e-05, + "loss": 0.8019, + "mean_token_accuracy": 0.759622585773468, + "num_tokens": 196516849.0, + "step": 82820 + }, + { + "epoch": 0.7594205556064912, + "learning_rate": 4.811772256349134e-05, + "loss": 0.8452, + "mean_token_accuracy": 0.7465933322906494, + "num_tokens": 196545889.0, + "step": 82830 + }, + { + "epoch": 0.7595122398459705, + "learning_rate": 4.809938571559549e-05, + "loss": 0.8452, + "mean_token_accuracy": 0.7508033812046051, + "num_tokens": 196575364.0, + "step": 82840 + }, + { + "epoch": 0.7596039240854497, + "learning_rate": 4.8081048867699644e-05, + "loss": 0.8958, + "mean_token_accuracy": 0.7373965382575989, + "num_tokens": 196604712.0, + "step": 82850 + }, + { + "epoch": 0.759695608324929, + "learning_rate": 4.8062712019803796e-05, + "loss": 0.9364, + "mean_token_accuracy": 0.7314100861549377, + "num_tokens": 196636162.0, + "step": 82860 + }, + { + "epoch": 0.7597872925644081, + "learning_rate": 4.8044375171907954e-05, + "loss": 0.8305, + "mean_token_accuracy": 0.754850035905838, + "num_tokens": 196665750.0, + "step": 82870 + }, + { + "epoch": 0.7598789768038874, + "learning_rate": 4.8026038324012106e-05, + "loss": 0.8319, + "mean_token_accuracy": 0.7528897941112518, + "num_tokens": 196694928.0, + "step": 82880 + }, + { + "epoch": 0.7599706610433666, + "learning_rate": 4.800770147611626e-05, + "loss": 0.8598, + "mean_token_accuracy": 0.7441156387329102, + "num_tokens": 196725611.0, + "step": 82890 + }, + { + "epoch": 0.7600623452828459, + "learning_rate": 4.798936462822041e-05, + "loss": 0.9098, + "mean_token_accuracy": 0.7359290599822998, + "num_tokens": 196756044.0, + "step": 82900 + }, + { + "epoch": 0.7601540295223251, + "learning_rate": 4.797102778032456e-05, + "loss": 0.881, + "mean_token_accuracy": 0.7421162307262421, + "num_tokens": 196786604.0, + "step": 82910 + }, + { + "epoch": 0.7602457137618044, + "learning_rate": 4.795269093242872e-05, + "loss": 0.8285, + "mean_token_accuracy": 0.7487018823623657, + "num_tokens": 196816354.0, + "step": 82920 + }, + { + "epoch": 0.7603373980012835, + "learning_rate": 4.793435408453287e-05, + "loss": 0.8021, + "mean_token_accuracy": 0.7550116896629333, + "num_tokens": 196844974.0, + "step": 82930 + }, + { + "epoch": 0.7604290822407628, + "learning_rate": 4.7916017236637024e-05, + "loss": 0.8017, + "mean_token_accuracy": 0.7594165742397309, + "num_tokens": 196873330.0, + "step": 82940 + }, + { + "epoch": 0.760520766480242, + "learning_rate": 4.7897680388741176e-05, + "loss": 0.8343, + "mean_token_accuracy": 0.7532778263092041, + "num_tokens": 196904073.0, + "step": 82950 + }, + { + "epoch": 0.7606124507197213, + "learning_rate": 4.787934354084533e-05, + "loss": 0.8622, + "mean_token_accuracy": 0.7470668494701386, + "num_tokens": 196934111.0, + "step": 82960 + }, + { + "epoch": 0.7607041349592005, + "learning_rate": 4.7861006692949486e-05, + "loss": 0.8852, + "mean_token_accuracy": 0.7404623091220855, + "num_tokens": 196965605.0, + "step": 82970 + }, + { + "epoch": 0.7607958191986798, + "learning_rate": 4.784266984505364e-05, + "loss": 0.8767, + "mean_token_accuracy": 0.7419257044792176, + "num_tokens": 196996708.0, + "step": 82980 + }, + { + "epoch": 0.760887503438159, + "learning_rate": 4.782433299715779e-05, + "loss": 0.7645, + "mean_token_accuracy": 0.773752760887146, + "num_tokens": 197023533.0, + "step": 82990 + }, + { + "epoch": 0.7609791876776382, + "learning_rate": 4.780599614926194e-05, + "loss": 0.8064, + "mean_token_accuracy": 0.7623594880104065, + "num_tokens": 197050875.0, + "step": 83000 + }, + { + "epoch": 0.7610708719171174, + "learning_rate": 4.77876593013661e-05, + "loss": 0.8016, + "mean_token_accuracy": 0.7565568685531616, + "num_tokens": 197079546.0, + "step": 83010 + }, + { + "epoch": 0.7611625561565967, + "learning_rate": 4.776932245347025e-05, + "loss": 0.8875, + "mean_token_accuracy": 0.737514728307724, + "num_tokens": 197109931.0, + "step": 83020 + }, + { + "epoch": 0.7612542403960759, + "learning_rate": 4.7750985605574404e-05, + "loss": 0.8826, + "mean_token_accuracy": 0.74748295545578, + "num_tokens": 197138034.0, + "step": 83030 + }, + { + "epoch": 0.7613459246355552, + "learning_rate": 4.7732648757678556e-05, + "loss": 0.8664, + "mean_token_accuracy": 0.7447394669055939, + "num_tokens": 197168245.0, + "step": 83040 + }, + { + "epoch": 0.7614376088750344, + "learning_rate": 4.771431190978271e-05, + "loss": 0.7924, + "mean_token_accuracy": 0.7621159255504608, + "num_tokens": 197195422.0, + "step": 83050 + }, + { + "epoch": 0.7615292931145136, + "learning_rate": 4.769597506188687e-05, + "loss": 0.8145, + "mean_token_accuracy": 0.7605322599411011, + "num_tokens": 197223696.0, + "step": 83060 + }, + { + "epoch": 0.7616209773539928, + "learning_rate": 4.767763821399102e-05, + "loss": 0.8269, + "mean_token_accuracy": 0.753108811378479, + "num_tokens": 197252412.0, + "step": 83070 + }, + { + "epoch": 0.7617126615934721, + "learning_rate": 4.765930136609517e-05, + "loss": 0.8927, + "mean_token_accuracy": 0.744899469614029, + "num_tokens": 197283719.0, + "step": 83080 + }, + { + "epoch": 0.7618043458329513, + "learning_rate": 4.764096451819932e-05, + "loss": 0.8821, + "mean_token_accuracy": 0.7437337219715119, + "num_tokens": 197313851.0, + "step": 83090 + }, + { + "epoch": 0.7618960300724306, + "learning_rate": 4.7622627670303474e-05, + "loss": 0.8824, + "mean_token_accuracy": 0.73881094455719, + "num_tokens": 197344418.0, + "step": 83100 + }, + { + "epoch": 0.7619877143119098, + "learning_rate": 4.760429082240763e-05, + "loss": 0.8003, + "mean_token_accuracy": 0.7583040416240692, + "num_tokens": 197373297.0, + "step": 83110 + }, + { + "epoch": 0.7620793985513891, + "learning_rate": 4.7585953974511785e-05, + "loss": 0.826, + "mean_token_accuracy": 0.7492796063423157, + "num_tokens": 197402050.0, + "step": 83120 + }, + { + "epoch": 0.7621710827908682, + "learning_rate": 4.756761712661594e-05, + "loss": 0.8339, + "mean_token_accuracy": 0.7554567039012909, + "num_tokens": 197431839.0, + "step": 83130 + }, + { + "epoch": 0.7622627670303475, + "learning_rate": 4.7549280278720095e-05, + "loss": 0.8877, + "mean_token_accuracy": 0.735871410369873, + "num_tokens": 197461976.0, + "step": 83140 + }, + { + "epoch": 0.7623544512698267, + "learning_rate": 4.753094343082424e-05, + "loss": 0.8506, + "mean_token_accuracy": 0.7509628176689148, + "num_tokens": 197491842.0, + "step": 83150 + }, + { + "epoch": 0.762446135509306, + "learning_rate": 4.75126065829284e-05, + "loss": 0.8941, + "mean_token_accuracy": 0.7376525521278381, + "num_tokens": 197523068.0, + "step": 83160 + }, + { + "epoch": 0.7625378197487852, + "learning_rate": 4.749426973503255e-05, + "loss": 0.8546, + "mean_token_accuracy": 0.7550153732299805, + "num_tokens": 197550315.0, + "step": 83170 + }, + { + "epoch": 0.7626295039882645, + "learning_rate": 4.74759328871367e-05, + "loss": 0.7762, + "mean_token_accuracy": 0.763424015045166, + "num_tokens": 197578711.0, + "step": 83180 + }, + { + "epoch": 0.7627211882277436, + "learning_rate": 4.745759603924086e-05, + "loss": 0.8624, + "mean_token_accuracy": 0.7480132102966308, + "num_tokens": 197608068.0, + "step": 83190 + }, + { + "epoch": 0.7628128724672228, + "learning_rate": 4.7439259191345007e-05, + "loss": 0.8742, + "mean_token_accuracy": 0.7452224850654602, + "num_tokens": 197639765.0, + "step": 83200 + }, + { + "epoch": 0.7629045567067021, + "learning_rate": 4.7420922343449165e-05, + "loss": 0.8813, + "mean_token_accuracy": 0.7406799018383026, + "num_tokens": 197671467.0, + "step": 83210 + }, + { + "epoch": 0.7629962409461813, + "learning_rate": 4.740258549555332e-05, + "loss": 0.8808, + "mean_token_accuracy": 0.7393268704414367, + "num_tokens": 197701847.0, + "step": 83220 + }, + { + "epoch": 0.7630879251856606, + "learning_rate": 4.738424864765747e-05, + "loss": 0.8206, + "mean_token_accuracy": 0.7561595857143402, + "num_tokens": 197730915.0, + "step": 83230 + }, + { + "epoch": 0.7631796094251398, + "learning_rate": 4.736591179976163e-05, + "loss": 0.7857, + "mean_token_accuracy": 0.764354532957077, + "num_tokens": 197759327.0, + "step": 83240 + }, + { + "epoch": 0.7632712936646191, + "learning_rate": 4.734757495186577e-05, + "loss": 0.8239, + "mean_token_accuracy": 0.7565077424049378, + "num_tokens": 197790398.0, + "step": 83250 + }, + { + "epoch": 0.7633629779040982, + "learning_rate": 4.732923810396993e-05, + "loss": 0.9003, + "mean_token_accuracy": 0.7374303638935089, + "num_tokens": 197822397.0, + "step": 83260 + }, + { + "epoch": 0.7634546621435775, + "learning_rate": 4.731090125607408e-05, + "loss": 0.8814, + "mean_token_accuracy": 0.7407468259334564, + "num_tokens": 197853152.0, + "step": 83270 + }, + { + "epoch": 0.7635463463830567, + "learning_rate": 4.7292564408178235e-05, + "loss": 0.9331, + "mean_token_accuracy": 0.7341228485107422, + "num_tokens": 197885302.0, + "step": 83280 + }, + { + "epoch": 0.763638030622536, + "learning_rate": 4.7274227560282394e-05, + "loss": 0.7912, + "mean_token_accuracy": 0.768936812877655, + "num_tokens": 197914041.0, + "step": 83290 + }, + { + "epoch": 0.7637297148620152, + "learning_rate": 4.725589071238654e-05, + "loss": 0.847, + "mean_token_accuracy": 0.7490604758262634, + "num_tokens": 197942657.0, + "step": 83300 + }, + { + "epoch": 0.7638213991014945, + "learning_rate": 4.72375538644907e-05, + "loss": 0.8241, + "mean_token_accuracy": 0.7578671872615814, + "num_tokens": 197971980.0, + "step": 83310 + }, + { + "epoch": 0.7639130833409737, + "learning_rate": 4.721921701659485e-05, + "loss": 0.877, + "mean_token_accuracy": 0.7484039485454559, + "num_tokens": 198002428.0, + "step": 83320 + }, + { + "epoch": 0.7640047675804529, + "learning_rate": 4.7200880168699e-05, + "loss": 0.9238, + "mean_token_accuracy": 0.7342865407466889, + "num_tokens": 198034811.0, + "step": 83330 + }, + { + "epoch": 0.7640964518199321, + "learning_rate": 4.718254332080316e-05, + "loss": 0.8576, + "mean_token_accuracy": 0.7481640815734864, + "num_tokens": 198066354.0, + "step": 83340 + }, + { + "epoch": 0.7641881360594114, + "learning_rate": 4.7164206472907305e-05, + "loss": 0.7919, + "mean_token_accuracy": 0.76490917801857, + "num_tokens": 198094464.0, + "step": 83350 + }, + { + "epoch": 0.7642798202988906, + "learning_rate": 4.7145869625011464e-05, + "loss": 0.8135, + "mean_token_accuracy": 0.7590794086456298, + "num_tokens": 198123125.0, + "step": 83360 + }, + { + "epoch": 0.7643715045383699, + "learning_rate": 4.7127532777115615e-05, + "loss": 0.87, + "mean_token_accuracy": 0.7405919671058655, + "num_tokens": 198154745.0, + "step": 83370 + }, + { + "epoch": 0.7644631887778491, + "learning_rate": 4.710919592921977e-05, + "loss": 0.9065, + "mean_token_accuracy": 0.7394024491310119, + "num_tokens": 198186066.0, + "step": 83380 + }, + { + "epoch": 0.7645548730173283, + "learning_rate": 4.7090859081323926e-05, + "loss": 0.8664, + "mean_token_accuracy": 0.7451089084148407, + "num_tokens": 198215268.0, + "step": 83390 + }, + { + "epoch": 0.7646465572568075, + "learning_rate": 4.707252223342807e-05, + "loss": 0.9282, + "mean_token_accuracy": 0.7341436266899108, + "num_tokens": 198245601.0, + "step": 83400 + }, + { + "epoch": 0.7647382414962868, + "learning_rate": 4.705418538553223e-05, + "loss": 0.8043, + "mean_token_accuracy": 0.7628137052059174, + "num_tokens": 198273978.0, + "step": 83410 + }, + { + "epoch": 0.764829925735766, + "learning_rate": 4.703584853763638e-05, + "loss": 0.8209, + "mean_token_accuracy": 0.7553904771804809, + "num_tokens": 198302357.0, + "step": 83420 + }, + { + "epoch": 0.7649216099752453, + "learning_rate": 4.701751168974053e-05, + "loss": 0.8497, + "mean_token_accuracy": 0.7504721581935883, + "num_tokens": 198332530.0, + "step": 83430 + }, + { + "epoch": 0.7650132942147245, + "learning_rate": 4.699917484184469e-05, + "loss": 0.8985, + "mean_token_accuracy": 0.7399794936180115, + "num_tokens": 198363573.0, + "step": 83440 + }, + { + "epoch": 0.7651049784542038, + "learning_rate": 4.6980837993948844e-05, + "loss": 0.8401, + "mean_token_accuracy": 0.7502639472484589, + "num_tokens": 198393768.0, + "step": 83450 + }, + { + "epoch": 0.7651966626936829, + "learning_rate": 4.6962501146052996e-05, + "loss": 0.876, + "mean_token_accuracy": 0.7438281536102295, + "num_tokens": 198424956.0, + "step": 83460 + }, + { + "epoch": 0.7652883469331622, + "learning_rate": 4.694416429815715e-05, + "loss": 0.8343, + "mean_token_accuracy": 0.7502440989017487, + "num_tokens": 198452901.0, + "step": 83470 + }, + { + "epoch": 0.7653800311726414, + "learning_rate": 4.69258274502613e-05, + "loss": 0.7875, + "mean_token_accuracy": 0.761256217956543, + "num_tokens": 198481584.0, + "step": 83480 + }, + { + "epoch": 0.7654717154121207, + "learning_rate": 4.690749060236546e-05, + "loss": 0.8424, + "mean_token_accuracy": 0.7500324428081513, + "num_tokens": 198510949.0, + "step": 83490 + }, + { + "epoch": 0.7655633996515999, + "learning_rate": 4.688915375446961e-05, + "loss": 0.8741, + "mean_token_accuracy": 0.7372589588165284, + "num_tokens": 198541344.0, + "step": 83500 + }, + { + "epoch": 0.7656550838910792, + "learning_rate": 4.687081690657376e-05, + "loss": 0.8291, + "mean_token_accuracy": 0.7572034418582916, + "num_tokens": 198570505.0, + "step": 83510 + }, + { + "epoch": 0.7657467681305583, + "learning_rate": 4.6852480058677914e-05, + "loss": 0.8831, + "mean_token_accuracy": 0.7366003334522248, + "num_tokens": 198601033.0, + "step": 83520 + }, + { + "epoch": 0.7658384523700376, + "learning_rate": 4.6834143210782066e-05, + "loss": 0.7692, + "mean_token_accuracy": 0.7724420845508575, + "num_tokens": 198628800.0, + "step": 83530 + }, + { + "epoch": 0.7659301366095168, + "learning_rate": 4.6815806362886224e-05, + "loss": 0.8236, + "mean_token_accuracy": 0.7546740949153901, + "num_tokens": 198656600.0, + "step": 83540 + }, + { + "epoch": 0.7660218208489961, + "learning_rate": 4.6797469514990376e-05, + "loss": 0.8618, + "mean_token_accuracy": 0.7460628628730774, + "num_tokens": 198685408.0, + "step": 83550 + }, + { + "epoch": 0.7661135050884753, + "learning_rate": 4.677913266709453e-05, + "loss": 0.8539, + "mean_token_accuracy": 0.7493011832237244, + "num_tokens": 198715341.0, + "step": 83560 + }, + { + "epoch": 0.7662051893279546, + "learning_rate": 4.676079581919868e-05, + "loss": 0.8612, + "mean_token_accuracy": 0.7442546784877777, + "num_tokens": 198745625.0, + "step": 83570 + }, + { + "epoch": 0.7662968735674338, + "learning_rate": 4.674245897130283e-05, + "loss": 0.8705, + "mean_token_accuracy": 0.7369942724704742, + "num_tokens": 198777699.0, + "step": 83580 + }, + { + "epoch": 0.766388557806913, + "learning_rate": 4.672412212340699e-05, + "loss": 0.8153, + "mean_token_accuracy": 0.7576233804225921, + "num_tokens": 198807217.0, + "step": 83590 + }, + { + "epoch": 0.7664802420463922, + "learning_rate": 4.670578527551114e-05, + "loss": 0.7992, + "mean_token_accuracy": 0.7615856409072876, + "num_tokens": 198835789.0, + "step": 83600 + }, + { + "epoch": 0.7665719262858715, + "learning_rate": 4.6687448427615294e-05, + "loss": 0.8994, + "mean_token_accuracy": 0.7378689825534821, + "num_tokens": 198866279.0, + "step": 83610 + }, + { + "epoch": 0.7666636105253507, + "learning_rate": 4.6669111579719446e-05, + "loss": 0.838, + "mean_token_accuracy": 0.753299742937088, + "num_tokens": 198897040.0, + "step": 83620 + }, + { + "epoch": 0.76675529476483, + "learning_rate": 4.6650774731823605e-05, + "loss": 0.8763, + "mean_token_accuracy": 0.7379263043403625, + "num_tokens": 198926864.0, + "step": 83630 + }, + { + "epoch": 0.7668469790043092, + "learning_rate": 4.6632437883927756e-05, + "loss": 0.8474, + "mean_token_accuracy": 0.7527245163917542, + "num_tokens": 198956688.0, + "step": 83640 + }, + { + "epoch": 0.7669386632437883, + "learning_rate": 4.661410103603191e-05, + "loss": 0.812, + "mean_token_accuracy": 0.7580152869224548, + "num_tokens": 198984155.0, + "step": 83650 + }, + { + "epoch": 0.7670303474832676, + "learning_rate": 4.659576418813606e-05, + "loss": 0.8323, + "mean_token_accuracy": 0.7555800259113312, + "num_tokens": 199012874.0, + "step": 83660 + }, + { + "epoch": 0.7671220317227468, + "learning_rate": 4.657742734024021e-05, + "loss": 0.8543, + "mean_token_accuracy": 0.7447729170322418, + "num_tokens": 199045041.0, + "step": 83670 + }, + { + "epoch": 0.7672137159622261, + "learning_rate": 4.655909049234437e-05, + "loss": 0.8939, + "mean_token_accuracy": 0.7398266553878784, + "num_tokens": 199075229.0, + "step": 83680 + }, + { + "epoch": 0.7673054002017053, + "learning_rate": 4.654075364444852e-05, + "loss": 0.896, + "mean_token_accuracy": 0.7374585330486297, + "num_tokens": 199106935.0, + "step": 83690 + }, + { + "epoch": 0.7673970844411846, + "learning_rate": 4.6522416796552674e-05, + "loss": 0.908, + "mean_token_accuracy": 0.734346729516983, + "num_tokens": 199139301.0, + "step": 83700 + }, + { + "epoch": 0.7674887686806638, + "learning_rate": 4.6504079948656826e-05, + "loss": 0.7976, + "mean_token_accuracy": 0.7622849762439727, + "num_tokens": 199168604.0, + "step": 83710 + }, + { + "epoch": 0.767580452920143, + "learning_rate": 4.648574310076098e-05, + "loss": 0.8412, + "mean_token_accuracy": 0.7505931615829468, + "num_tokens": 199198406.0, + "step": 83720 + }, + { + "epoch": 0.7676721371596222, + "learning_rate": 4.646740625286514e-05, + "loss": 0.8734, + "mean_token_accuracy": 0.7455028116703033, + "num_tokens": 199228350.0, + "step": 83730 + }, + { + "epoch": 0.7677638213991015, + "learning_rate": 4.644906940496929e-05, + "loss": 0.914, + "mean_token_accuracy": 0.7364421486854553, + "num_tokens": 199260398.0, + "step": 83740 + }, + { + "epoch": 0.7678555056385807, + "learning_rate": 4.643073255707344e-05, + "loss": 0.8972, + "mean_token_accuracy": 0.7416184782981873, + "num_tokens": 199291315.0, + "step": 83750 + }, + { + "epoch": 0.76794718987806, + "learning_rate": 4.641239570917759e-05, + "loss": 0.8853, + "mean_token_accuracy": 0.7424000024795532, + "num_tokens": 199321979.0, + "step": 83760 + }, + { + "epoch": 0.7680388741175392, + "learning_rate": 4.6394058861281744e-05, + "loss": 0.7973, + "mean_token_accuracy": 0.7612855434417725, + "num_tokens": 199350143.0, + "step": 83770 + }, + { + "epoch": 0.7681305583570184, + "learning_rate": 4.63757220133859e-05, + "loss": 0.7887, + "mean_token_accuracy": 0.7664248049259186, + "num_tokens": 199378249.0, + "step": 83780 + }, + { + "epoch": 0.7682222425964976, + "learning_rate": 4.6357385165490055e-05, + "loss": 0.856, + "mean_token_accuracy": 0.74514821767807, + "num_tokens": 199406682.0, + "step": 83790 + }, + { + "epoch": 0.7683139268359769, + "learning_rate": 4.633904831759421e-05, + "loss": 0.8775, + "mean_token_accuracy": 0.7419812917709351, + "num_tokens": 199437232.0, + "step": 83800 + }, + { + "epoch": 0.7684056110754561, + "learning_rate": 4.6320711469698365e-05, + "loss": 0.8988, + "mean_token_accuracy": 0.7366764843463898, + "num_tokens": 199467606.0, + "step": 83810 + }, + { + "epoch": 0.7684972953149354, + "learning_rate": 4.630237462180251e-05, + "loss": 0.9094, + "mean_token_accuracy": 0.734112274646759, + "num_tokens": 199498892.0, + "step": 83820 + }, + { + "epoch": 0.7685889795544146, + "learning_rate": 4.628403777390667e-05, + "loss": 0.8255, + "mean_token_accuracy": 0.7513435065746308, + "num_tokens": 199528224.0, + "step": 83830 + }, + { + "epoch": 0.7686806637938939, + "learning_rate": 4.626570092601082e-05, + "loss": 0.8432, + "mean_token_accuracy": 0.7515334784984589, + "num_tokens": 199557846.0, + "step": 83840 + }, + { + "epoch": 0.768772348033373, + "learning_rate": 4.624736407811497e-05, + "loss": 0.8959, + "mean_token_accuracy": 0.7378568053245544, + "num_tokens": 199589559.0, + "step": 83850 + }, + { + "epoch": 0.7688640322728523, + "learning_rate": 4.622902723021913e-05, + "loss": 0.9457, + "mean_token_accuracy": 0.7292453050613403, + "num_tokens": 199622291.0, + "step": 83860 + }, + { + "epoch": 0.7689557165123315, + "learning_rate": 4.6210690382323277e-05, + "loss": 0.8829, + "mean_token_accuracy": 0.7407571256160737, + "num_tokens": 199652353.0, + "step": 83870 + }, + { + "epoch": 0.7690474007518108, + "learning_rate": 4.6192353534427435e-05, + "loss": 0.9178, + "mean_token_accuracy": 0.7299648880958557, + "num_tokens": 199683926.0, + "step": 83880 + }, + { + "epoch": 0.76913908499129, + "learning_rate": 4.617401668653159e-05, + "loss": 0.7779, + "mean_token_accuracy": 0.7676116824150085, + "num_tokens": 199711655.0, + "step": 83890 + }, + { + "epoch": 0.7692307692307693, + "learning_rate": 4.615567983863574e-05, + "loss": 0.8324, + "mean_token_accuracy": 0.7521481812000275, + "num_tokens": 199740477.0, + "step": 83900 + }, + { + "epoch": 0.7693224534702484, + "learning_rate": 4.61373429907399e-05, + "loss": 0.8689, + "mean_token_accuracy": 0.7458119213581085, + "num_tokens": 199769862.0, + "step": 83910 + }, + { + "epoch": 0.7694141377097277, + "learning_rate": 4.611900614284404e-05, + "loss": 0.8911, + "mean_token_accuracy": 0.7416059374809265, + "num_tokens": 199802392.0, + "step": 83920 + }, + { + "epoch": 0.7695058219492069, + "learning_rate": 4.61006692949482e-05, + "loss": 0.9199, + "mean_token_accuracy": 0.736228609085083, + "num_tokens": 199834387.0, + "step": 83930 + }, + { + "epoch": 0.7695975061886862, + "learning_rate": 4.608233244705236e-05, + "loss": 0.8846, + "mean_token_accuracy": 0.7385479390621186, + "num_tokens": 199866001.0, + "step": 83940 + }, + { + "epoch": 0.7696891904281654, + "learning_rate": 4.6063995599156505e-05, + "loss": 0.8315, + "mean_token_accuracy": 0.7526941895484924, + "num_tokens": 199896559.0, + "step": 83950 + }, + { + "epoch": 0.7697808746676447, + "learning_rate": 4.6045658751260664e-05, + "loss": 0.7973, + "mean_token_accuracy": 0.758766508102417, + "num_tokens": 199925437.0, + "step": 83960 + }, + { + "epoch": 0.7698725589071239, + "learning_rate": 4.602732190336481e-05, + "loss": 0.8696, + "mean_token_accuracy": 0.7400624334812165, + "num_tokens": 199954560.0, + "step": 83970 + }, + { + "epoch": 0.7699642431466031, + "learning_rate": 4.600898505546897e-05, + "loss": 0.92, + "mean_token_accuracy": 0.7286685883998871, + "num_tokens": 199987075.0, + "step": 83980 + }, + { + "epoch": 0.7700559273860823, + "learning_rate": 4.5990648207573126e-05, + "loss": 0.8926, + "mean_token_accuracy": 0.7395737707614899, + "num_tokens": 200016068.0, + "step": 83990 + }, + { + "epoch": 0.7701476116255616, + "learning_rate": 4.597231135967727e-05, + "loss": 0.9438, + "mean_token_accuracy": 0.7261269629001618, + "num_tokens": 200048478.0, + "step": 84000 + }, + { + "epoch": 0.7702392958650408, + "learning_rate": 4.595397451178143e-05, + "loss": 0.8153, + "mean_token_accuracy": 0.7573321878910064, + "num_tokens": 200075808.0, + "step": 84010 + }, + { + "epoch": 0.7703309801045201, + "learning_rate": 4.5935637663885575e-05, + "loss": 0.8183, + "mean_token_accuracy": 0.7568739056587219, + "num_tokens": 200104732.0, + "step": 84020 + }, + { + "epoch": 0.7704226643439993, + "learning_rate": 4.5917300815989733e-05, + "loss": 0.8919, + "mean_token_accuracy": 0.7371907711029053, + "num_tokens": 200135263.0, + "step": 84030 + }, + { + "epoch": 0.7705143485834784, + "learning_rate": 4.589896396809389e-05, + "loss": 0.892, + "mean_token_accuracy": 0.7385146617889404, + "num_tokens": 200167528.0, + "step": 84040 + }, + { + "epoch": 0.7706060328229577, + "learning_rate": 4.588062712019804e-05, + "loss": 0.8677, + "mean_token_accuracy": 0.7420639574527741, + "num_tokens": 200198130.0, + "step": 84050 + }, + { + "epoch": 0.770697717062437, + "learning_rate": 4.5862290272302196e-05, + "loss": 0.9424, + "mean_token_accuracy": 0.7321244180202484, + "num_tokens": 200230737.0, + "step": 84060 + }, + { + "epoch": 0.7707894013019162, + "learning_rate": 4.584395342440634e-05, + "loss": 0.8257, + "mean_token_accuracy": 0.7498086869716645, + "num_tokens": 200259700.0, + "step": 84070 + }, + { + "epoch": 0.7708810855413954, + "learning_rate": 4.58256165765105e-05, + "loss": 0.7886, + "mean_token_accuracy": 0.7610655963420868, + "num_tokens": 200289453.0, + "step": 84080 + }, + { + "epoch": 0.7709727697808747, + "learning_rate": 4.580727972861466e-05, + "loss": 0.8737, + "mean_token_accuracy": 0.7464800536632538, + "num_tokens": 200319562.0, + "step": 84090 + }, + { + "epoch": 0.771064454020354, + "learning_rate": 4.57889428807188e-05, + "loss": 0.8658, + "mean_token_accuracy": 0.743821769952774, + "num_tokens": 200350979.0, + "step": 84100 + }, + { + "epoch": 0.7711561382598331, + "learning_rate": 4.577060603282296e-05, + "loss": 0.8971, + "mean_token_accuracy": 0.7383689880371094, + "num_tokens": 200382264.0, + "step": 84110 + }, + { + "epoch": 0.7712478224993123, + "learning_rate": 4.5752269184927114e-05, + "loss": 0.9323, + "mean_token_accuracy": 0.725857412815094, + "num_tokens": 200415235.0, + "step": 84120 + }, + { + "epoch": 0.7713395067387916, + "learning_rate": 4.5733932337031266e-05, + "loss": 0.8418, + "mean_token_accuracy": 0.747672826051712, + "num_tokens": 200445720.0, + "step": 84130 + }, + { + "epoch": 0.7714311909782708, + "learning_rate": 4.5715595489135424e-05, + "loss": 0.803, + "mean_token_accuracy": 0.7635540187358856, + "num_tokens": 200476026.0, + "step": 84140 + }, + { + "epoch": 0.7715228752177501, + "learning_rate": 4.569725864123957e-05, + "loss": 0.8746, + "mean_token_accuracy": 0.7424876809120178, + "num_tokens": 200506677.0, + "step": 84150 + }, + { + "epoch": 0.7716145594572293, + "learning_rate": 4.567892179334373e-05, + "loss": 0.89, + "mean_token_accuracy": 0.7448381662368775, + "num_tokens": 200538444.0, + "step": 84160 + }, + { + "epoch": 0.7717062436967085, + "learning_rate": 4.566058494544788e-05, + "loss": 0.9157, + "mean_token_accuracy": 0.7318846702575683, + "num_tokens": 200570153.0, + "step": 84170 + }, + { + "epoch": 0.7717979279361877, + "learning_rate": 4.564224809755203e-05, + "loss": 0.9456, + "mean_token_accuracy": 0.7250260949134827, + "num_tokens": 200602444.0, + "step": 84180 + }, + { + "epoch": 0.771889612175667, + "learning_rate": 4.562391124965619e-05, + "loss": 0.8404, + "mean_token_accuracy": 0.7524682223796845, + "num_tokens": 200631794.0, + "step": 84190 + }, + { + "epoch": 0.7719812964151462, + "learning_rate": 4.5605574401760336e-05, + "loss": 0.8398, + "mean_token_accuracy": 0.7515843987464905, + "num_tokens": 200660885.0, + "step": 84200 + }, + { + "epoch": 0.7720729806546255, + "learning_rate": 4.5587237553864494e-05, + "loss": 0.8494, + "mean_token_accuracy": 0.7495680034160614, + "num_tokens": 200689887.0, + "step": 84210 + }, + { + "epoch": 0.7721646648941047, + "learning_rate": 4.5568900705968646e-05, + "loss": 0.8933, + "mean_token_accuracy": 0.74183189868927, + "num_tokens": 200721427.0, + "step": 84220 + }, + { + "epoch": 0.772256349133584, + "learning_rate": 4.55505638580728e-05, + "loss": 0.9562, + "mean_token_accuracy": 0.7235827565193176, + "num_tokens": 200754076.0, + "step": 84230 + }, + { + "epoch": 0.7723480333730631, + "learning_rate": 4.5532227010176957e-05, + "loss": 0.9456, + "mean_token_accuracy": 0.7272350370883942, + "num_tokens": 200786233.0, + "step": 84240 + }, + { + "epoch": 0.7724397176125424, + "learning_rate": 4.551389016228111e-05, + "loss": 0.864, + "mean_token_accuracy": 0.751090008020401, + "num_tokens": 200816630.0, + "step": 84250 + }, + { + "epoch": 0.7725314018520216, + "learning_rate": 4.549555331438526e-05, + "loss": 0.8299, + "mean_token_accuracy": 0.7541809618473053, + "num_tokens": 200846453.0, + "step": 84260 + }, + { + "epoch": 0.7726230860915009, + "learning_rate": 4.547721646648941e-05, + "loss": 0.8606, + "mean_token_accuracy": 0.7469097554683686, + "num_tokens": 200878278.0, + "step": 84270 + }, + { + "epoch": 0.7727147703309801, + "learning_rate": 4.5458879618593564e-05, + "loss": 0.9055, + "mean_token_accuracy": 0.7331558406352997, + "num_tokens": 200910438.0, + "step": 84280 + }, + { + "epoch": 0.7728064545704594, + "learning_rate": 4.544054277069772e-05, + "loss": 0.9232, + "mean_token_accuracy": 0.7295502841472625, + "num_tokens": 200942229.0, + "step": 84290 + }, + { + "epoch": 0.7728981388099385, + "learning_rate": 4.5422205922801875e-05, + "loss": 0.9289, + "mean_token_accuracy": 0.7294548392295838, + "num_tokens": 200973791.0, + "step": 84300 + }, + { + "epoch": 0.7729898230494178, + "learning_rate": 4.5403869074906026e-05, + "loss": 0.8163, + "mean_token_accuracy": 0.7611810564994812, + "num_tokens": 201002468.0, + "step": 84310 + }, + { + "epoch": 0.773081507288897, + "learning_rate": 4.538553222701018e-05, + "loss": 0.8038, + "mean_token_accuracy": 0.7570303320884705, + "num_tokens": 201030933.0, + "step": 84320 + }, + { + "epoch": 0.7731731915283763, + "learning_rate": 4.536719537911433e-05, + "loss": 0.8405, + "mean_token_accuracy": 0.7499175071716309, + "num_tokens": 201060148.0, + "step": 84330 + }, + { + "epoch": 0.7732648757678555, + "learning_rate": 4.534885853121849e-05, + "loss": 0.9224, + "mean_token_accuracy": 0.7309393227100373, + "num_tokens": 201092407.0, + "step": 84340 + }, + { + "epoch": 0.7733565600073348, + "learning_rate": 4.533052168332264e-05, + "loss": 0.9403, + "mean_token_accuracy": 0.7300654292106629, + "num_tokens": 201124023.0, + "step": 84350 + }, + { + "epoch": 0.773448244246814, + "learning_rate": 4.531218483542679e-05, + "loss": 0.8964, + "mean_token_accuracy": 0.7361896634101868, + "num_tokens": 201157314.0, + "step": 84360 + }, + { + "epoch": 0.7735399284862932, + "learning_rate": 4.5293847987530944e-05, + "loss": 0.8118, + "mean_token_accuracy": 0.7588523328304291, + "num_tokens": 201187175.0, + "step": 84370 + }, + { + "epoch": 0.7736316127257724, + "learning_rate": 4.5275511139635096e-05, + "loss": 0.8386, + "mean_token_accuracy": 0.7514602661132812, + "num_tokens": 201215879.0, + "step": 84380 + }, + { + "epoch": 0.7737232969652517, + "learning_rate": 4.5257174291739255e-05, + "loss": 0.8733, + "mean_token_accuracy": 0.7433182656764984, + "num_tokens": 201246132.0, + "step": 84390 + }, + { + "epoch": 0.7738149812047309, + "learning_rate": 4.523883744384341e-05, + "loss": 0.8868, + "mean_token_accuracy": 0.7378167867660522, + "num_tokens": 201277352.0, + "step": 84400 + }, + { + "epoch": 0.7739066654442102, + "learning_rate": 4.522050059594756e-05, + "loss": 0.9115, + "mean_token_accuracy": 0.7333837032318116, + "num_tokens": 201307674.0, + "step": 84410 + }, + { + "epoch": 0.7739983496836894, + "learning_rate": 4.520216374805171e-05, + "loss": 0.9436, + "mean_token_accuracy": 0.7246712803840637, + "num_tokens": 201338505.0, + "step": 84420 + }, + { + "epoch": 0.7740900339231686, + "learning_rate": 4.518382690015587e-05, + "loss": 0.8314, + "mean_token_accuracy": 0.7528190314769745, + "num_tokens": 201368586.0, + "step": 84430 + }, + { + "epoch": 0.7741817181626478, + "learning_rate": 4.516549005226002e-05, + "loss": 0.8547, + "mean_token_accuracy": 0.7471593379974365, + "num_tokens": 201398791.0, + "step": 84440 + }, + { + "epoch": 0.774273402402127, + "learning_rate": 4.514715320436417e-05, + "loss": 0.8734, + "mean_token_accuracy": 0.7454115688800812, + "num_tokens": 201428615.0, + "step": 84450 + }, + { + "epoch": 0.7743650866416063, + "learning_rate": 4.5128816356468325e-05, + "loss": 0.8787, + "mean_token_accuracy": 0.7385600090026856, + "num_tokens": 201457486.0, + "step": 84460 + }, + { + "epoch": 0.7744567708810856, + "learning_rate": 4.511047950857248e-05, + "loss": 0.9413, + "mean_token_accuracy": 0.7282081961631774, + "num_tokens": 201490066.0, + "step": 84470 + }, + { + "epoch": 0.7745484551205648, + "learning_rate": 4.5092142660676635e-05, + "loss": 0.9275, + "mean_token_accuracy": 0.7271670460700989, + "num_tokens": 201521823.0, + "step": 84480 + }, + { + "epoch": 0.774640139360044, + "learning_rate": 4.507380581278079e-05, + "loss": 0.816, + "mean_token_accuracy": 0.7563360810279847, + "num_tokens": 201551414.0, + "step": 84490 + }, + { + "epoch": 0.7747318235995232, + "learning_rate": 4.505546896488494e-05, + "loss": 0.828, + "mean_token_accuracy": 0.751528549194336, + "num_tokens": 201581548.0, + "step": 84500 + }, + { + "epoch": 0.7748235078390024, + "learning_rate": 4.503713211698909e-05, + "loss": 0.8881, + "mean_token_accuracy": 0.7387636959552765, + "num_tokens": 201612070.0, + "step": 84510 + }, + { + "epoch": 0.7749151920784817, + "learning_rate": 4.501879526909324e-05, + "loss": 0.9027, + "mean_token_accuracy": 0.7346662044525146, + "num_tokens": 201643590.0, + "step": 84520 + }, + { + "epoch": 0.775006876317961, + "learning_rate": 4.50004584211974e-05, + "loss": 0.8896, + "mean_token_accuracy": 0.73323375582695, + "num_tokens": 201676507.0, + "step": 84530 + }, + { + "epoch": 0.7750985605574402, + "learning_rate": 4.498212157330155e-05, + "loss": 0.8294, + "mean_token_accuracy": 0.7489039301872253, + "num_tokens": 201706025.0, + "step": 84540 + }, + { + "epoch": 0.7751902447969194, + "learning_rate": 4.4963784725405705e-05, + "loss": 0.8175, + "mean_token_accuracy": 0.7632289946079254, + "num_tokens": 201736084.0, + "step": 84550 + }, + { + "epoch": 0.7752819290363987, + "learning_rate": 4.4945447877509864e-05, + "loss": 0.8187, + "mean_token_accuracy": 0.7637658715248108, + "num_tokens": 201765245.0, + "step": 84560 + }, + { + "epoch": 0.7753736132758778, + "learning_rate": 4.492711102961401e-05, + "loss": 0.8779, + "mean_token_accuracy": 0.7411769688129425, + "num_tokens": 201796342.0, + "step": 84570 + }, + { + "epoch": 0.7754652975153571, + "learning_rate": 4.490877418171817e-05, + "loss": 0.8723, + "mean_token_accuracy": 0.7425032436847687, + "num_tokens": 201827445.0, + "step": 84580 + }, + { + "epoch": 0.7755569817548363, + "learning_rate": 4.489043733382232e-05, + "loss": 0.919, + "mean_token_accuracy": 0.733311927318573, + "num_tokens": 201860193.0, + "step": 84590 + }, + { + "epoch": 0.7756486659943156, + "learning_rate": 4.487210048592647e-05, + "loss": 0.8842, + "mean_token_accuracy": 0.7423205018043518, + "num_tokens": 201891888.0, + "step": 84600 + }, + { + "epoch": 0.7757403502337948, + "learning_rate": 4.485376363803063e-05, + "loss": 0.8954, + "mean_token_accuracy": 0.7401693165302277, + "num_tokens": 201922830.0, + "step": 84610 + }, + { + "epoch": 0.7758320344732741, + "learning_rate": 4.4835426790134775e-05, + "loss": 0.8415, + "mean_token_accuracy": 0.7449678301811218, + "num_tokens": 201953230.0, + "step": 84620 + }, + { + "epoch": 0.7759237187127532, + "learning_rate": 4.4817089942238934e-05, + "loss": 0.8791, + "mean_token_accuracy": 0.7392831981182099, + "num_tokens": 201984164.0, + "step": 84630 + }, + { + "epoch": 0.7760154029522325, + "learning_rate": 4.4798753094343086e-05, + "loss": 0.8799, + "mean_token_accuracy": 0.7358763754367829, + "num_tokens": 202016124.0, + "step": 84640 + }, + { + "epoch": 0.7761070871917117, + "learning_rate": 4.478041624644724e-05, + "loss": 0.9292, + "mean_token_accuracy": 0.728614866733551, + "num_tokens": 202047239.0, + "step": 84650 + }, + { + "epoch": 0.776198771431191, + "learning_rate": 4.4762079398551396e-05, + "loss": 0.9635, + "mean_token_accuracy": 0.7204731047153473, + "num_tokens": 202080247.0, + "step": 84660 + }, + { + "epoch": 0.7762904556706702, + "learning_rate": 4.474374255065554e-05, + "loss": 0.8521, + "mean_token_accuracy": 0.7442466080188751, + "num_tokens": 202110467.0, + "step": 84670 + }, + { + "epoch": 0.7763821399101495, + "learning_rate": 4.47254057027597e-05, + "loss": 0.9123, + "mean_token_accuracy": 0.7306386232376099, + "num_tokens": 202140448.0, + "step": 84680 + }, + { + "epoch": 0.7764738241496287, + "learning_rate": 4.470706885486385e-05, + "loss": 0.9171, + "mean_token_accuracy": 0.7329727530479431, + "num_tokens": 202171500.0, + "step": 84690 + }, + { + "epoch": 0.7765655083891079, + "learning_rate": 4.4688732006968003e-05, + "loss": 0.9455, + "mean_token_accuracy": 0.7198031067848205, + "num_tokens": 202202563.0, + "step": 84700 + }, + { + "epoch": 0.7766571926285871, + "learning_rate": 4.467039515907216e-05, + "loss": 0.9206, + "mean_token_accuracy": 0.7255331695079803, + "num_tokens": 202235172.0, + "step": 84710 + }, + { + "epoch": 0.7767488768680664, + "learning_rate": 4.465205831117631e-05, + "loss": 0.9466, + "mean_token_accuracy": 0.7252993047237396, + "num_tokens": 202266689.0, + "step": 84720 + }, + { + "epoch": 0.7768405611075456, + "learning_rate": 4.4633721463280466e-05, + "loss": 0.8708, + "mean_token_accuracy": 0.7456136643886566, + "num_tokens": 202296034.0, + "step": 84730 + }, + { + "epoch": 0.7769322453470249, + "learning_rate": 4.461538461538462e-05, + "loss": 0.9051, + "mean_token_accuracy": 0.7344099283218384, + "num_tokens": 202325764.0, + "step": 84740 + }, + { + "epoch": 0.7770239295865041, + "learning_rate": 4.459704776748877e-05, + "loss": 0.9168, + "mean_token_accuracy": 0.7299425065517425, + "num_tokens": 202357366.0, + "step": 84750 + }, + { + "epoch": 0.7771156138259833, + "learning_rate": 4.457871091959293e-05, + "loss": 0.9272, + "mean_token_accuracy": 0.7272787809371948, + "num_tokens": 202388766.0, + "step": 84760 + }, + { + "epoch": 0.7772072980654625, + "learning_rate": 4.456037407169707e-05, + "loss": 0.9505, + "mean_token_accuracy": 0.7295663893222809, + "num_tokens": 202420890.0, + "step": 84770 + }, + { + "epoch": 0.7772989823049418, + "learning_rate": 4.454203722380123e-05, + "loss": 0.9288, + "mean_token_accuracy": 0.7241439163684845, + "num_tokens": 202453652.0, + "step": 84780 + }, + { + "epoch": 0.777390666544421, + "learning_rate": 4.4523700375905384e-05, + "loss": 0.7904, + "mean_token_accuracy": 0.764022845029831, + "num_tokens": 202483012.0, + "step": 84790 + }, + { + "epoch": 0.7774823507839003, + "learning_rate": 4.4505363528009536e-05, + "loss": 0.876, + "mean_token_accuracy": 0.74369495511055, + "num_tokens": 202512468.0, + "step": 84800 + }, + { + "epoch": 0.7775740350233795, + "learning_rate": 4.4487026680113694e-05, + "loss": 0.8888, + "mean_token_accuracy": 0.7436029970645904, + "num_tokens": 202543085.0, + "step": 84810 + }, + { + "epoch": 0.7776657192628588, + "learning_rate": 4.446868983221784e-05, + "loss": 0.8977, + "mean_token_accuracy": 0.7374972462654114, + "num_tokens": 202574931.0, + "step": 84820 + }, + { + "epoch": 0.7777574035023379, + "learning_rate": 4.4450352984322e-05, + "loss": 0.9219, + "mean_token_accuracy": 0.7311857998371124, + "num_tokens": 202605767.0, + "step": 84830 + }, + { + "epoch": 0.7778490877418172, + "learning_rate": 4.443201613642615e-05, + "loss": 0.9917, + "mean_token_accuracy": 0.708983552455902, + "num_tokens": 202637227.0, + "step": 84840 + }, + { + "epoch": 0.7779407719812964, + "learning_rate": 4.44136792885303e-05, + "loss": 0.8176, + "mean_token_accuracy": 0.7531644344329834, + "num_tokens": 202666585.0, + "step": 84850 + }, + { + "epoch": 0.7780324562207757, + "learning_rate": 4.439534244063446e-05, + "loss": 0.8822, + "mean_token_accuracy": 0.7419060647487641, + "num_tokens": 202695105.0, + "step": 84860 + }, + { + "epoch": 0.7781241404602549, + "learning_rate": 4.437700559273861e-05, + "loss": 0.9061, + "mean_token_accuracy": 0.7396051228046417, + "num_tokens": 202725029.0, + "step": 84870 + }, + { + "epoch": 0.7782158246997342, + "learning_rate": 4.4358668744842764e-05, + "loss": 0.9203, + "mean_token_accuracy": 0.7300542056560516, + "num_tokens": 202756201.0, + "step": 84880 + }, + { + "epoch": 0.7783075089392133, + "learning_rate": 4.4340331896946916e-05, + "loss": 0.9299, + "mean_token_accuracy": 0.7266810297966003, + "num_tokens": 202787496.0, + "step": 84890 + }, + { + "epoch": 0.7783991931786925, + "learning_rate": 4.432199504905107e-05, + "loss": 0.9405, + "mean_token_accuracy": 0.7293095231056214, + "num_tokens": 202818788.0, + "step": 84900 + }, + { + "epoch": 0.7784908774181718, + "learning_rate": 4.4303658201155227e-05, + "loss": 0.8745, + "mean_token_accuracy": 0.7482227504253387, + "num_tokens": 202848512.0, + "step": 84910 + }, + { + "epoch": 0.778582561657651, + "learning_rate": 4.428532135325938e-05, + "loss": 0.9322, + "mean_token_accuracy": 0.7277007639408112, + "num_tokens": 202880024.0, + "step": 84920 + }, + { + "epoch": 0.7786742458971303, + "learning_rate": 4.426698450536353e-05, + "loss": 0.8641, + "mean_token_accuracy": 0.7422133386135101, + "num_tokens": 202908196.0, + "step": 84930 + }, + { + "epoch": 0.7787659301366096, + "learning_rate": 4.424864765746768e-05, + "loss": 0.9212, + "mean_token_accuracy": 0.7326892197132111, + "num_tokens": 202939300.0, + "step": 84940 + }, + { + "epoch": 0.7788576143760888, + "learning_rate": 4.4230310809571834e-05, + "loss": 0.9712, + "mean_token_accuracy": 0.7154947459697724, + "num_tokens": 202970845.0, + "step": 84950 + }, + { + "epoch": 0.7789492986155679, + "learning_rate": 4.421197396167599e-05, + "loss": 1.0009, + "mean_token_accuracy": 0.709311020374298, + "num_tokens": 203003510.0, + "step": 84960 + }, + { + "epoch": 0.7790409828550472, + "learning_rate": 4.4193637113780145e-05, + "loss": 0.871, + "mean_token_accuracy": 0.7473345458507538, + "num_tokens": 203033017.0, + "step": 84970 + }, + { + "epoch": 0.7791326670945264, + "learning_rate": 4.4175300265884296e-05, + "loss": 0.8542, + "mean_token_accuracy": 0.7498608231544495, + "num_tokens": 203063345.0, + "step": 84980 + }, + { + "epoch": 0.7792243513340057, + "learning_rate": 4.415696341798845e-05, + "loss": 0.9385, + "mean_token_accuracy": 0.7267225861549378, + "num_tokens": 203095697.0, + "step": 84990 + }, + { + "epoch": 0.7793160355734849, + "learning_rate": 4.41386265700926e-05, + "loss": 0.9433, + "mean_token_accuracy": 0.7269436657428742, + "num_tokens": 203124455.0, + "step": 85000 + }, + { + "epoch": 0.7794077198129642, + "learning_rate": 4.412028972219676e-05, + "loss": 0.9273, + "mean_token_accuracy": 0.728283804655075, + "num_tokens": 203154919.0, + "step": 85010 + }, + { + "epoch": 0.7794994040524433, + "learning_rate": 4.410195287430091e-05, + "loss": 0.9829, + "mean_token_accuracy": 0.7103117644786835, + "num_tokens": 203187800.0, + "step": 85020 + }, + { + "epoch": 0.7795910882919226, + "learning_rate": 4.408361602640506e-05, + "loss": 0.9565, + "mean_token_accuracy": 0.7182743668556213, + "num_tokens": 203218880.0, + "step": 85030 + }, + { + "epoch": 0.7796827725314018, + "learning_rate": 4.4065279178509214e-05, + "loss": 0.8866, + "mean_token_accuracy": 0.7394263863563537, + "num_tokens": 203248934.0, + "step": 85040 + }, + { + "epoch": 0.7797744567708811, + "learning_rate": 4.404694233061337e-05, + "loss": 0.9379, + "mean_token_accuracy": 0.7228012382984161, + "num_tokens": 203280843.0, + "step": 85050 + }, + { + "epoch": 0.7798661410103603, + "learning_rate": 4.4028605482717525e-05, + "loss": 0.9425, + "mean_token_accuracy": 0.7212895274162292, + "num_tokens": 203311333.0, + "step": 85060 + }, + { + "epoch": 0.7799578252498396, + "learning_rate": 4.401026863482168e-05, + "loss": 0.9497, + "mean_token_accuracy": 0.7190118849277496, + "num_tokens": 203340792.0, + "step": 85070 + }, + { + "epoch": 0.7800495094893188, + "learning_rate": 4.399193178692583e-05, + "loss": 1.0117, + "mean_token_accuracy": 0.7057639479637146, + "num_tokens": 203373247.0, + "step": 85080 + }, + { + "epoch": 0.780141193728798, + "learning_rate": 4.397359493902998e-05, + "loss": 0.9147, + "mean_token_accuracy": 0.7353187441825867, + "num_tokens": 203403771.0, + "step": 85090 + }, + { + "epoch": 0.7802328779682772, + "learning_rate": 4.395525809113414e-05, + "loss": 0.8419, + "mean_token_accuracy": 0.7530937850475311, + "num_tokens": 203432165.0, + "step": 85100 + }, + { + "epoch": 0.7803245622077565, + "learning_rate": 4.393692124323829e-05, + "loss": 0.9221, + "mean_token_accuracy": 0.7253668546676636, + "num_tokens": 203463622.0, + "step": 85110 + }, + { + "epoch": 0.7804162464472357, + "learning_rate": 4.391858439534244e-05, + "loss": 0.9305, + "mean_token_accuracy": 0.7277561604976654, + "num_tokens": 203493975.0, + "step": 85120 + }, + { + "epoch": 0.780507930686715, + "learning_rate": 4.3900247547446595e-05, + "loss": 0.9299, + "mean_token_accuracy": 0.7265092074871063, + "num_tokens": 203526252.0, + "step": 85130 + }, + { + "epoch": 0.7805996149261942, + "learning_rate": 4.388191069955075e-05, + "loss": 0.9744, + "mean_token_accuracy": 0.7142821848392487, + "num_tokens": 203558265.0, + "step": 85140 + }, + { + "epoch": 0.7806912991656734, + "learning_rate": 4.3863573851654905e-05, + "loss": 0.9289, + "mean_token_accuracy": 0.7281145811080932, + "num_tokens": 203588600.0, + "step": 85150 + }, + { + "epoch": 0.7807829834051526, + "learning_rate": 4.384523700375906e-05, + "loss": 0.8988, + "mean_token_accuracy": 0.7322739660739899, + "num_tokens": 203618580.0, + "step": 85160 + }, + { + "epoch": 0.7808746676446319, + "learning_rate": 4.382690015586321e-05, + "loss": 0.9139, + "mean_token_accuracy": 0.732365733385086, + "num_tokens": 203648771.0, + "step": 85170 + }, + { + "epoch": 0.7809663518841111, + "learning_rate": 4.380856330796737e-05, + "loss": 0.8923, + "mean_token_accuracy": 0.7362757682800293, + "num_tokens": 203679033.0, + "step": 85180 + }, + { + "epoch": 0.7810580361235904, + "learning_rate": 4.379022646007151e-05, + "loss": 0.9599, + "mean_token_accuracy": 0.7195428729057312, + "num_tokens": 203709799.0, + "step": 85190 + }, + { + "epoch": 0.7811497203630696, + "learning_rate": 4.377188961217567e-05, + "loss": 0.9826, + "mean_token_accuracy": 0.7132642209529877, + "num_tokens": 203742326.0, + "step": 85200 + }, + { + "epoch": 0.7812414046025489, + "learning_rate": 4.375355276427982e-05, + "loss": 0.9505, + "mean_token_accuracy": 0.7204755544662476, + "num_tokens": 203772828.0, + "step": 85210 + }, + { + "epoch": 0.781333088842028, + "learning_rate": 4.3735215916383975e-05, + "loss": 0.925, + "mean_token_accuracy": 0.7311704814434051, + "num_tokens": 203803662.0, + "step": 85220 + }, + { + "epoch": 0.7814247730815073, + "learning_rate": 4.3716879068488134e-05, + "loss": 0.908, + "mean_token_accuracy": 0.730689388513565, + "num_tokens": 203835342.0, + "step": 85230 + }, + { + "epoch": 0.7815164573209865, + "learning_rate": 4.369854222059228e-05, + "loss": 0.9193, + "mean_token_accuracy": 0.7279924213886261, + "num_tokens": 203866841.0, + "step": 85240 + }, + { + "epoch": 0.7816081415604658, + "learning_rate": 4.368020537269644e-05, + "loss": 0.9362, + "mean_token_accuracy": 0.7220112979412079, + "num_tokens": 203898902.0, + "step": 85250 + }, + { + "epoch": 0.781699825799945, + "learning_rate": 4.366186852480059e-05, + "loss": 0.982, + "mean_token_accuracy": 0.7149511456489563, + "num_tokens": 203929119.0, + "step": 85260 + }, + { + "epoch": 0.7817915100394243, + "learning_rate": 4.364353167690474e-05, + "loss": 0.8408, + "mean_token_accuracy": 0.7517880320549011, + "num_tokens": 203957857.0, + "step": 85270 + }, + { + "epoch": 0.7818831942789034, + "learning_rate": 4.36251948290089e-05, + "loss": 0.8561, + "mean_token_accuracy": 0.7452545762062073, + "num_tokens": 203987995.0, + "step": 85280 + }, + { + "epoch": 0.7819748785183827, + "learning_rate": 4.3606857981113045e-05, + "loss": 0.9465, + "mean_token_accuracy": 0.7230924427509308, + "num_tokens": 204019828.0, + "step": 85290 + }, + { + "epoch": 0.7820665627578619, + "learning_rate": 4.3588521133217204e-05, + "loss": 0.9771, + "mean_token_accuracy": 0.7162556827068329, + "num_tokens": 204050518.0, + "step": 85300 + }, + { + "epoch": 0.7821582469973412, + "learning_rate": 4.3570184285321355e-05, + "loss": 0.9974, + "mean_token_accuracy": 0.7094563007354736, + "num_tokens": 204081752.0, + "step": 85310 + }, + { + "epoch": 0.7822499312368204, + "learning_rate": 4.355184743742551e-05, + "loss": 0.9511, + "mean_token_accuracy": 0.7223043501377105, + "num_tokens": 204113843.0, + "step": 85320 + }, + { + "epoch": 0.7823416154762997, + "learning_rate": 4.3533510589529666e-05, + "loss": 0.918, + "mean_token_accuracy": 0.7277221381664276, + "num_tokens": 204144549.0, + "step": 85330 + }, + { + "epoch": 0.7824332997157789, + "learning_rate": 4.351517374163381e-05, + "loss": 0.9252, + "mean_token_accuracy": 0.7253208816051483, + "num_tokens": 204174183.0, + "step": 85340 + }, + { + "epoch": 0.782524983955258, + "learning_rate": 4.349683689373797e-05, + "loss": 0.9265, + "mean_token_accuracy": 0.7277453958988189, + "num_tokens": 204203736.0, + "step": 85350 + }, + { + "epoch": 0.7826166681947373, + "learning_rate": 4.347850004584212e-05, + "loss": 0.9236, + "mean_token_accuracy": 0.7261824786663056, + "num_tokens": 204234407.0, + "step": 85360 + }, + { + "epoch": 0.7827083524342165, + "learning_rate": 4.3460163197946273e-05, + "loss": 1.0011, + "mean_token_accuracy": 0.7111550986766815, + "num_tokens": 204265568.0, + "step": 85370 + }, + { + "epoch": 0.7828000366736958, + "learning_rate": 4.344182635005043e-05, + "loss": 1.0047, + "mean_token_accuracy": 0.7094777584075928, + "num_tokens": 204297246.0, + "step": 85380 + }, + { + "epoch": 0.782891720913175, + "learning_rate": 4.342348950215458e-05, + "loss": 0.9529, + "mean_token_accuracy": 0.7222318828105927, + "num_tokens": 204328172.0, + "step": 85390 + }, + { + "epoch": 0.7829834051526543, + "learning_rate": 4.3405152654258736e-05, + "loss": 0.9411, + "mean_token_accuracy": 0.724736875295639, + "num_tokens": 204359965.0, + "step": 85400 + }, + { + "epoch": 0.7830750893921334, + "learning_rate": 4.338681580636289e-05, + "loss": 0.9049, + "mean_token_accuracy": 0.7343593955039978, + "num_tokens": 204388535.0, + "step": 85410 + }, + { + "epoch": 0.7831667736316127, + "learning_rate": 4.336847895846704e-05, + "loss": 0.9364, + "mean_token_accuracy": 0.7264476478099823, + "num_tokens": 204419646.0, + "step": 85420 + }, + { + "epoch": 0.7832584578710919, + "learning_rate": 4.33501421105712e-05, + "loss": 0.9928, + "mean_token_accuracy": 0.7078803420066834, + "num_tokens": 204451427.0, + "step": 85430 + }, + { + "epoch": 0.7833501421105712, + "learning_rate": 4.333180526267534e-05, + "loss": 0.9807, + "mean_token_accuracy": 0.7140648603439331, + "num_tokens": 204483315.0, + "step": 85440 + }, + { + "epoch": 0.7834418263500504, + "learning_rate": 4.33134684147795e-05, + "loss": 0.9581, + "mean_token_accuracy": 0.7227704703807831, + "num_tokens": 204514192.0, + "step": 85450 + }, + { + "epoch": 0.7835335105895297, + "learning_rate": 4.3295131566883654e-05, + "loss": 0.9696, + "mean_token_accuracy": 0.7156088948249817, + "num_tokens": 204546443.0, + "step": 85460 + }, + { + "epoch": 0.7836251948290089, + "learning_rate": 4.3276794718987806e-05, + "loss": 0.9062, + "mean_token_accuracy": 0.7343481063842774, + "num_tokens": 204575418.0, + "step": 85470 + }, + { + "epoch": 0.7837168790684881, + "learning_rate": 4.3258457871091964e-05, + "loss": 0.9247, + "mean_token_accuracy": 0.7347521424293518, + "num_tokens": 204604497.0, + "step": 85480 + }, + { + "epoch": 0.7838085633079673, + "learning_rate": 4.3240121023196116e-05, + "loss": 0.9379, + "mean_token_accuracy": 0.7259818851947785, + "num_tokens": 204636027.0, + "step": 85490 + }, + { + "epoch": 0.7839002475474466, + "learning_rate": 4.322178417530027e-05, + "loss": 0.9598, + "mean_token_accuracy": 0.7194625914096833, + "num_tokens": 204665751.0, + "step": 85500 + }, + { + "epoch": 0.7839919317869258, + "learning_rate": 4.320344732740442e-05, + "loss": 0.9427, + "mean_token_accuracy": 0.7234639585018158, + "num_tokens": 204696619.0, + "step": 85510 + }, + { + "epoch": 0.7840836160264051, + "learning_rate": 4.318511047950857e-05, + "loss": 0.9258, + "mean_token_accuracy": 0.72845818400383, + "num_tokens": 204727234.0, + "step": 85520 + }, + { + "epoch": 0.7841753002658843, + "learning_rate": 4.316677363161273e-05, + "loss": 0.9738, + "mean_token_accuracy": 0.7165741324424744, + "num_tokens": 204758365.0, + "step": 85530 + }, + { + "epoch": 0.7842669845053635, + "learning_rate": 4.314843678371688e-05, + "loss": 0.9308, + "mean_token_accuracy": 0.7249511480331421, + "num_tokens": 204788072.0, + "step": 85540 + }, + { + "epoch": 0.7843586687448427, + "learning_rate": 4.3130099935821034e-05, + "loss": 0.9726, + "mean_token_accuracy": 0.7123758435249329, + "num_tokens": 204820049.0, + "step": 85550 + }, + { + "epoch": 0.784450352984322, + "learning_rate": 4.3111763087925186e-05, + "loss": 0.9901, + "mean_token_accuracy": 0.7127663850784302, + "num_tokens": 204852210.0, + "step": 85560 + }, + { + "epoch": 0.7845420372238012, + "learning_rate": 4.309342624002934e-05, + "loss": 0.9583, + "mean_token_accuracy": 0.7225412964820862, + "num_tokens": 204883826.0, + "step": 85570 + }, + { + "epoch": 0.7846337214632805, + "learning_rate": 4.3075089392133497e-05, + "loss": 0.9376, + "mean_token_accuracy": 0.7293244659900665, + "num_tokens": 204913908.0, + "step": 85580 + }, + { + "epoch": 0.7847254057027597, + "learning_rate": 4.305675254423765e-05, + "loss": 0.9075, + "mean_token_accuracy": 0.7326092720031738, + "num_tokens": 204943379.0, + "step": 85590 + }, + { + "epoch": 0.784817089942239, + "learning_rate": 4.30384156963418e-05, + "loss": 0.963, + "mean_token_accuracy": 0.7229960322380066, + "num_tokens": 204973014.0, + "step": 85600 + }, + { + "epoch": 0.7849087741817181, + "learning_rate": 4.302007884844595e-05, + "loss": 0.9614, + "mean_token_accuracy": 0.7152164518833161, + "num_tokens": 205003916.0, + "step": 85610 + }, + { + "epoch": 0.7850004584211974, + "learning_rate": 4.3001742000550104e-05, + "loss": 0.9744, + "mean_token_accuracy": 0.7146295487880707, + "num_tokens": 205035936.0, + "step": 85620 + }, + { + "epoch": 0.7850921426606766, + "learning_rate": 4.298340515265426e-05, + "loss": 0.8923, + "mean_token_accuracy": 0.7326450228691102, + "num_tokens": 205065906.0, + "step": 85630 + }, + { + "epoch": 0.7851838269001559, + "learning_rate": 4.2965068304758415e-05, + "loss": 0.9256, + "mean_token_accuracy": 0.7261049807071686, + "num_tokens": 205096946.0, + "step": 85640 + }, + { + "epoch": 0.7852755111396351, + "learning_rate": 4.2946731456862566e-05, + "loss": 0.9383, + "mean_token_accuracy": 0.7194655418395997, + "num_tokens": 205127826.0, + "step": 85650 + }, + { + "epoch": 0.7853671953791144, + "learning_rate": 4.292839460896672e-05, + "loss": 0.9784, + "mean_token_accuracy": 0.717509651184082, + "num_tokens": 205158790.0, + "step": 85660 + }, + { + "epoch": 0.7854588796185935, + "learning_rate": 4.291005776107088e-05, + "loss": 0.9821, + "mean_token_accuracy": 0.7088741362094879, + "num_tokens": 205190469.0, + "step": 85670 + }, + { + "epoch": 0.7855505638580728, + "learning_rate": 4.289172091317503e-05, + "loss": 0.9785, + "mean_token_accuracy": 0.7216758668422699, + "num_tokens": 205222866.0, + "step": 85680 + }, + { + "epoch": 0.785642248097552, + "learning_rate": 4.287338406527918e-05, + "loss": 0.9381, + "mean_token_accuracy": 0.7183633208274841, + "num_tokens": 205254301.0, + "step": 85690 + }, + { + "epoch": 0.7857339323370313, + "learning_rate": 4.285504721738333e-05, + "loss": 0.9383, + "mean_token_accuracy": 0.7200577795505524, + "num_tokens": 205285066.0, + "step": 85700 + }, + { + "epoch": 0.7858256165765105, + "learning_rate": 4.2836710369487484e-05, + "loss": 0.9244, + "mean_token_accuracy": 0.7277416586875916, + "num_tokens": 205315437.0, + "step": 85710 + }, + { + "epoch": 0.7859173008159898, + "learning_rate": 4.281837352159164e-05, + "loss": 0.9436, + "mean_token_accuracy": 0.7256674766540527, + "num_tokens": 205345801.0, + "step": 85720 + }, + { + "epoch": 0.786008985055469, + "learning_rate": 4.2800036673695795e-05, + "loss": 0.9864, + "mean_token_accuracy": 0.7110663473606109, + "num_tokens": 205376755.0, + "step": 85730 + }, + { + "epoch": 0.7861006692949482, + "learning_rate": 4.278169982579995e-05, + "loss": 0.94, + "mean_token_accuracy": 0.7245600104331971, + "num_tokens": 205408368.0, + "step": 85740 + }, + { + "epoch": 0.7861923535344274, + "learning_rate": 4.27633629779041e-05, + "loss": 0.9223, + "mean_token_accuracy": 0.7295901298522949, + "num_tokens": 205439240.0, + "step": 85750 + }, + { + "epoch": 0.7862840377739067, + "learning_rate": 4.274502613000825e-05, + "loss": 0.9529, + "mean_token_accuracy": 0.7168604910373688, + "num_tokens": 205470574.0, + "step": 85760 + }, + { + "epoch": 0.7863757220133859, + "learning_rate": 4.272668928211241e-05, + "loss": 0.9254, + "mean_token_accuracy": 0.7269407451152802, + "num_tokens": 205500238.0, + "step": 85770 + }, + { + "epoch": 0.7864674062528652, + "learning_rate": 4.270835243421656e-05, + "loss": 0.9354, + "mean_token_accuracy": 0.723615849018097, + "num_tokens": 205531274.0, + "step": 85780 + }, + { + "epoch": 0.7865590904923444, + "learning_rate": 4.269001558632071e-05, + "loss": 0.9792, + "mean_token_accuracy": 0.7170191884040833, + "num_tokens": 205561885.0, + "step": 85790 + }, + { + "epoch": 0.7866507747318237, + "learning_rate": 4.267167873842487e-05, + "loss": 1.0023, + "mean_token_accuracy": 0.7014797627925873, + "num_tokens": 205594519.0, + "step": 85800 + }, + { + "epoch": 0.7867424589713028, + "learning_rate": 4.265334189052902e-05, + "loss": 0.9237, + "mean_token_accuracy": 0.7250907301902771, + "num_tokens": 205624925.0, + "step": 85810 + }, + { + "epoch": 0.786834143210782, + "learning_rate": 4.2635005042633175e-05, + "loss": 0.9818, + "mean_token_accuracy": 0.718622499704361, + "num_tokens": 205655815.0, + "step": 85820 + }, + { + "epoch": 0.7869258274502613, + "learning_rate": 4.261666819473733e-05, + "loss": 0.9674, + "mean_token_accuracy": 0.7219990491867065, + "num_tokens": 205686521.0, + "step": 85830 + }, + { + "epoch": 0.7870175116897405, + "learning_rate": 4.259833134684148e-05, + "loss": 0.9835, + "mean_token_accuracy": 0.711795425415039, + "num_tokens": 205717221.0, + "step": 85840 + }, + { + "epoch": 0.7871091959292198, + "learning_rate": 4.257999449894564e-05, + "loss": 0.9802, + "mean_token_accuracy": 0.7074107944965362, + "num_tokens": 205748332.0, + "step": 85850 + }, + { + "epoch": 0.787200880168699, + "learning_rate": 4.256165765104978e-05, + "loss": 1.0081, + "mean_token_accuracy": 0.7061544060707092, + "num_tokens": 205779804.0, + "step": 85860 + }, + { + "epoch": 0.7872925644081782, + "learning_rate": 4.254332080315394e-05, + "loss": 0.9367, + "mean_token_accuracy": 0.7253042876720428, + "num_tokens": 205810867.0, + "step": 85870 + }, + { + "epoch": 0.7873842486476574, + "learning_rate": 4.252498395525809e-05, + "loss": 0.9277, + "mean_token_accuracy": 0.7289303541183472, + "num_tokens": 205841162.0, + "step": 85880 + }, + { + "epoch": 0.7874759328871367, + "learning_rate": 4.2506647107362245e-05, + "loss": 0.9194, + "mean_token_accuracy": 0.7317416131496429, + "num_tokens": 205871116.0, + "step": 85890 + }, + { + "epoch": 0.7875676171266159, + "learning_rate": 4.2488310259466404e-05, + "loss": 0.9376, + "mean_token_accuracy": 0.7267865717411042, + "num_tokens": 205902306.0, + "step": 85900 + }, + { + "epoch": 0.7876593013660952, + "learning_rate": 4.246997341157055e-05, + "loss": 1.0033, + "mean_token_accuracy": 0.710684472322464, + "num_tokens": 205933430.0, + "step": 85910 + }, + { + "epoch": 0.7877509856055744, + "learning_rate": 4.245163656367471e-05, + "loss": 0.9965, + "mean_token_accuracy": 0.7057823538780212, + "num_tokens": 205965521.0, + "step": 85920 + }, + { + "epoch": 0.7878426698450537, + "learning_rate": 4.243329971577886e-05, + "loss": 0.9651, + "mean_token_accuracy": 0.7150196135044098, + "num_tokens": 205996241.0, + "step": 85930 + }, + { + "epoch": 0.7879343540845328, + "learning_rate": 4.241496286788301e-05, + "loss": 0.913, + "mean_token_accuracy": 0.7292705357074738, + "num_tokens": 206028691.0, + "step": 85940 + }, + { + "epoch": 0.7880260383240121, + "learning_rate": 4.239662601998717e-05, + "loss": 0.9167, + "mean_token_accuracy": 0.727678781747818, + "num_tokens": 206058956.0, + "step": 85950 + }, + { + "epoch": 0.7881177225634913, + "learning_rate": 4.2378289172091315e-05, + "loss": 0.9074, + "mean_token_accuracy": 0.731557309627533, + "num_tokens": 206088534.0, + "step": 85960 + }, + { + "epoch": 0.7882094068029706, + "learning_rate": 4.2359952324195474e-05, + "loss": 0.9231, + "mean_token_accuracy": 0.7272307634353637, + "num_tokens": 206118561.0, + "step": 85970 + }, + { + "epoch": 0.7883010910424498, + "learning_rate": 4.2341615476299625e-05, + "loss": 0.9724, + "mean_token_accuracy": 0.7200353980064392, + "num_tokens": 206149601.0, + "step": 85980 + }, + { + "epoch": 0.7883927752819291, + "learning_rate": 4.232327862840378e-05, + "loss": 0.941, + "mean_token_accuracy": 0.7229769468307495, + "num_tokens": 206181182.0, + "step": 85990 + }, + { + "epoch": 0.7884844595214082, + "learning_rate": 4.2304941780507936e-05, + "loss": 0.9742, + "mean_token_accuracy": 0.7207611382007599, + "num_tokens": 206212657.0, + "step": 86000 + }, + { + "epoch": 0.7885761437608875, + "learning_rate": 4.228660493261208e-05, + "loss": 0.9226, + "mean_token_accuracy": 0.7291601181030274, + "num_tokens": 206242838.0, + "step": 86010 + }, + { + "epoch": 0.7886678280003667, + "learning_rate": 4.226826808471624e-05, + "loss": 0.9221, + "mean_token_accuracy": 0.7228618323802948, + "num_tokens": 206273413.0, + "step": 86020 + }, + { + "epoch": 0.788759512239846, + "learning_rate": 4.224993123682039e-05, + "loss": 0.9624, + "mean_token_accuracy": 0.7189518511295319, + "num_tokens": 206303787.0, + "step": 86030 + }, + { + "epoch": 0.7888511964793252, + "learning_rate": 4.2231594388924543e-05, + "loss": 1.0058, + "mean_token_accuracy": 0.7108011722564698, + "num_tokens": 206335862.0, + "step": 86040 + }, + { + "epoch": 0.7889428807188045, + "learning_rate": 4.22132575410287e-05, + "loss": 0.9642, + "mean_token_accuracy": 0.7218930304050446, + "num_tokens": 206367383.0, + "step": 86050 + }, + { + "epoch": 0.7890345649582837, + "learning_rate": 4.219492069313285e-05, + "loss": 0.9627, + "mean_token_accuracy": 0.7193548262119294, + "num_tokens": 206399338.0, + "step": 86060 + }, + { + "epoch": 0.7891262491977629, + "learning_rate": 4.2176583845237006e-05, + "loss": 0.9422, + "mean_token_accuracy": 0.7254627764225006, + "num_tokens": 206428629.0, + "step": 86070 + }, + { + "epoch": 0.7892179334372421, + "learning_rate": 4.215824699734116e-05, + "loss": 0.9064, + "mean_token_accuracy": 0.7301589667797088, + "num_tokens": 206459320.0, + "step": 86080 + }, + { + "epoch": 0.7893096176767214, + "learning_rate": 4.213991014944531e-05, + "loss": 1.0068, + "mean_token_accuracy": 0.7062439560890198, + "num_tokens": 206490337.0, + "step": 86090 + }, + { + "epoch": 0.7894013019162006, + "learning_rate": 4.212157330154947e-05, + "loss": 1.0443, + "mean_token_accuracy": 0.701622599363327, + "num_tokens": 206523471.0, + "step": 86100 + }, + { + "epoch": 0.7894929861556799, + "learning_rate": 4.210323645365362e-05, + "loss": 0.938, + "mean_token_accuracy": 0.7256350219249725, + "num_tokens": 206555000.0, + "step": 86110 + }, + { + "epoch": 0.7895846703951591, + "learning_rate": 4.208489960575777e-05, + "loss": 0.9443, + "mean_token_accuracy": 0.7241138577461242, + "num_tokens": 206586403.0, + "step": 86120 + }, + { + "epoch": 0.7896763546346383, + "learning_rate": 4.2066562757861924e-05, + "loss": 0.9196, + "mean_token_accuracy": 0.7292301297187805, + "num_tokens": 206617668.0, + "step": 86130 + }, + { + "epoch": 0.7897680388741175, + "learning_rate": 4.2048225909966076e-05, + "loss": 0.9188, + "mean_token_accuracy": 0.7290456116199493, + "num_tokens": 206647003.0, + "step": 86140 + }, + { + "epoch": 0.7898597231135968, + "learning_rate": 4.2029889062070234e-05, + "loss": 0.9503, + "mean_token_accuracy": 0.7188356459140778, + "num_tokens": 206677488.0, + "step": 86150 + }, + { + "epoch": 0.789951407353076, + "learning_rate": 4.2011552214174386e-05, + "loss": 1.0146, + "mean_token_accuracy": 0.7011561453342438, + "num_tokens": 206710237.0, + "step": 86160 + }, + { + "epoch": 0.7900430915925553, + "learning_rate": 4.199321536627854e-05, + "loss": 0.9456, + "mean_token_accuracy": 0.7251852512359619, + "num_tokens": 206741244.0, + "step": 86170 + }, + { + "epoch": 0.7901347758320345, + "learning_rate": 4.197487851838269e-05, + "loss": 0.9304, + "mean_token_accuracy": 0.726626968383789, + "num_tokens": 206771750.0, + "step": 86180 + }, + { + "epoch": 0.7902264600715138, + "learning_rate": 4.195654167048684e-05, + "loss": 0.9277, + "mean_token_accuracy": 0.7317323207855224, + "num_tokens": 206801113.0, + "step": 86190 + }, + { + "epoch": 0.7903181443109929, + "learning_rate": 4.1938204822591e-05, + "loss": 0.9484, + "mean_token_accuracy": 0.7219361066818237, + "num_tokens": 206831264.0, + "step": 86200 + }, + { + "epoch": 0.7904098285504721, + "learning_rate": 4.191986797469515e-05, + "loss": 0.985, + "mean_token_accuracy": 0.7095797717571258, + "num_tokens": 206861152.0, + "step": 86210 + }, + { + "epoch": 0.7905015127899514, + "learning_rate": 4.1901531126799304e-05, + "loss": 1.0338, + "mean_token_accuracy": 0.7008227586746216, + "num_tokens": 206894524.0, + "step": 86220 + }, + { + "epoch": 0.7905931970294306, + "learning_rate": 4.1883194278903456e-05, + "loss": 0.947, + "mean_token_accuracy": 0.7251901149749755, + "num_tokens": 206926614.0, + "step": 86230 + }, + { + "epoch": 0.7906848812689099, + "learning_rate": 4.186485743100761e-05, + "loss": 0.8958, + "mean_token_accuracy": 0.7344070792198181, + "num_tokens": 206956324.0, + "step": 86240 + }, + { + "epoch": 0.7907765655083892, + "learning_rate": 4.1846520583111767e-05, + "loss": 0.918, + "mean_token_accuracy": 0.7315007209777832, + "num_tokens": 206986553.0, + "step": 86250 + }, + { + "epoch": 0.7908682497478683, + "learning_rate": 4.182818373521592e-05, + "loss": 0.9576, + "mean_token_accuracy": 0.7177666246891021, + "num_tokens": 207015442.0, + "step": 86260 + }, + { + "epoch": 0.7909599339873475, + "learning_rate": 4.180984688732007e-05, + "loss": 0.9983, + "mean_token_accuracy": 0.7080096542835236, + "num_tokens": 207046148.0, + "step": 86270 + }, + { + "epoch": 0.7910516182268268, + "learning_rate": 4.179151003942422e-05, + "loss": 0.993, + "mean_token_accuracy": 0.7078933179378509, + "num_tokens": 207078683.0, + "step": 86280 + }, + { + "epoch": 0.791143302466306, + "learning_rate": 4.177317319152838e-05, + "loss": 0.9512, + "mean_token_accuracy": 0.7187549829483032, + "num_tokens": 207110629.0, + "step": 86290 + }, + { + "epoch": 0.7912349867057853, + "learning_rate": 4.175483634363253e-05, + "loss": 0.9383, + "mean_token_accuracy": 0.7207545340061188, + "num_tokens": 207142785.0, + "step": 86300 + }, + { + "epoch": 0.7913266709452645, + "learning_rate": 4.1736499495736685e-05, + "loss": 0.9432, + "mean_token_accuracy": 0.7170807123184204, + "num_tokens": 207174222.0, + "step": 86310 + }, + { + "epoch": 0.7914183551847438, + "learning_rate": 4.1718162647840836e-05, + "loss": 0.9318, + "mean_token_accuracy": 0.7256855189800262, + "num_tokens": 207203828.0, + "step": 86320 + }, + { + "epoch": 0.7915100394242229, + "learning_rate": 4.169982579994499e-05, + "loss": 0.9996, + "mean_token_accuracy": 0.7121340036392212, + "num_tokens": 207235423.0, + "step": 86330 + }, + { + "epoch": 0.7916017236637022, + "learning_rate": 4.168148895204915e-05, + "loss": 1.025, + "mean_token_accuracy": 0.7054444551467896, + "num_tokens": 207267939.0, + "step": 86340 + }, + { + "epoch": 0.7916934079031814, + "learning_rate": 4.16631521041533e-05, + "loss": 0.9746, + "mean_token_accuracy": 0.7115237712860107, + "num_tokens": 207299252.0, + "step": 86350 + }, + { + "epoch": 0.7917850921426607, + "learning_rate": 4.164481525625745e-05, + "loss": 0.9356, + "mean_token_accuracy": 0.7275644659996032, + "num_tokens": 207330027.0, + "step": 86360 + }, + { + "epoch": 0.7918767763821399, + "learning_rate": 4.16264784083616e-05, + "loss": 0.9645, + "mean_token_accuracy": 0.7202916145324707, + "num_tokens": 207360485.0, + "step": 86370 + }, + { + "epoch": 0.7919684606216192, + "learning_rate": 4.1608141560465754e-05, + "loss": 0.9338, + "mean_token_accuracy": 0.7204845726490021, + "num_tokens": 207390182.0, + "step": 86380 + }, + { + "epoch": 0.7920601448610983, + "learning_rate": 4.158980471256991e-05, + "loss": 0.9812, + "mean_token_accuracy": 0.7126319408416748, + "num_tokens": 207421621.0, + "step": 86390 + }, + { + "epoch": 0.7921518291005776, + "learning_rate": 4.1571467864674065e-05, + "loss": 0.982, + "mean_token_accuracy": 0.7128823220729827, + "num_tokens": 207452915.0, + "step": 86400 + }, + { + "epoch": 0.7922435133400568, + "learning_rate": 4.155313101677822e-05, + "loss": 0.9098, + "mean_token_accuracy": 0.7332341194152832, + "num_tokens": 207485097.0, + "step": 86410 + }, + { + "epoch": 0.7923351975795361, + "learning_rate": 4.1534794168882375e-05, + "loss": 0.9255, + "mean_token_accuracy": 0.726281863451004, + "num_tokens": 207516399.0, + "step": 86420 + }, + { + "epoch": 0.7924268818190153, + "learning_rate": 4.151645732098652e-05, + "loss": 0.9435, + "mean_token_accuracy": 0.7231832683086395, + "num_tokens": 207545822.0, + "step": 86430 + }, + { + "epoch": 0.7925185660584946, + "learning_rate": 4.149812047309068e-05, + "loss": 0.9137, + "mean_token_accuracy": 0.7281588971614837, + "num_tokens": 207577365.0, + "step": 86440 + }, + { + "epoch": 0.7926102502979738, + "learning_rate": 4.147978362519483e-05, + "loss": 0.9902, + "mean_token_accuracy": 0.7107552766799927, + "num_tokens": 207609490.0, + "step": 86450 + }, + { + "epoch": 0.792701934537453, + "learning_rate": 4.146144677729898e-05, + "loss": 1.0435, + "mean_token_accuracy": 0.6976045489311218, + "num_tokens": 207641595.0, + "step": 86460 + }, + { + "epoch": 0.7927936187769322, + "learning_rate": 4.144310992940314e-05, + "loss": 0.9172, + "mean_token_accuracy": 0.7304158270359039, + "num_tokens": 207672793.0, + "step": 86470 + }, + { + "epoch": 0.7928853030164115, + "learning_rate": 4.142477308150729e-05, + "loss": 0.9302, + "mean_token_accuracy": 0.7257893681526184, + "num_tokens": 207704947.0, + "step": 86480 + }, + { + "epoch": 0.7929769872558907, + "learning_rate": 4.1406436233611445e-05, + "loss": 0.8942, + "mean_token_accuracy": 0.7341605126857758, + "num_tokens": 207732974.0, + "step": 86490 + }, + { + "epoch": 0.79306867149537, + "learning_rate": 4.13880993857156e-05, + "loss": 0.9159, + "mean_token_accuracy": 0.7367580354213714, + "num_tokens": 207764858.0, + "step": 86500 + }, + { + "epoch": 0.7931603557348492, + "learning_rate": 4.136976253781975e-05, + "loss": 0.9533, + "mean_token_accuracy": 0.7214776396751403, + "num_tokens": 207796150.0, + "step": 86510 + }, + { + "epoch": 0.7932520399743284, + "learning_rate": 4.135142568992391e-05, + "loss": 1.0098, + "mean_token_accuracy": 0.7000498592853546, + "num_tokens": 207828544.0, + "step": 86520 + }, + { + "epoch": 0.7933437242138076, + "learning_rate": 4.133308884202805e-05, + "loss": 0.9567, + "mean_token_accuracy": 0.7159042656421661, + "num_tokens": 207860620.0, + "step": 86530 + }, + { + "epoch": 0.7934354084532869, + "learning_rate": 4.131475199413221e-05, + "loss": 0.9484, + "mean_token_accuracy": 0.7242303311824798, + "num_tokens": 207891856.0, + "step": 86540 + }, + { + "epoch": 0.7935270926927661, + "learning_rate": 4.129641514623636e-05, + "loss": 0.9261, + "mean_token_accuracy": 0.7282198309898377, + "num_tokens": 207923777.0, + "step": 86550 + }, + { + "epoch": 0.7936187769322454, + "learning_rate": 4.1278078298340515e-05, + "loss": 0.9429, + "mean_token_accuracy": 0.7287190020084381, + "num_tokens": 207952121.0, + "step": 86560 + }, + { + "epoch": 0.7937104611717246, + "learning_rate": 4.1259741450444674e-05, + "loss": 0.9804, + "mean_token_accuracy": 0.7127610504627228, + "num_tokens": 207983744.0, + "step": 86570 + }, + { + "epoch": 0.7938021454112039, + "learning_rate": 4.124140460254882e-05, + "loss": 1.0303, + "mean_token_accuracy": 0.7046155571937561, + "num_tokens": 208016574.0, + "step": 86580 + }, + { + "epoch": 0.793893829650683, + "learning_rate": 4.122306775465298e-05, + "loss": 0.9377, + "mean_token_accuracy": 0.7199788987636566, + "num_tokens": 208048233.0, + "step": 86590 + }, + { + "epoch": 0.7939855138901623, + "learning_rate": 4.1204730906757136e-05, + "loss": 0.9388, + "mean_token_accuracy": 0.7236958265304565, + "num_tokens": 208078638.0, + "step": 86600 + }, + { + "epoch": 0.7940771981296415, + "learning_rate": 4.118639405886128e-05, + "loss": 0.9066, + "mean_token_accuracy": 0.7310633838176728, + "num_tokens": 208109993.0, + "step": 86610 + }, + { + "epoch": 0.7941688823691208, + "learning_rate": 4.116805721096544e-05, + "loss": 0.9464, + "mean_token_accuracy": 0.7216531753540039, + "num_tokens": 208140842.0, + "step": 86620 + }, + { + "epoch": 0.7942605666086, + "learning_rate": 4.1149720363069585e-05, + "loss": 1.0227, + "mean_token_accuracy": 0.7035574436187744, + "num_tokens": 208171321.0, + "step": 86630 + }, + { + "epoch": 0.7943522508480793, + "learning_rate": 4.1131383515173744e-05, + "loss": 0.958, + "mean_token_accuracy": 0.7149340093135834, + "num_tokens": 208202668.0, + "step": 86640 + }, + { + "epoch": 0.7944439350875584, + "learning_rate": 4.11130466672779e-05, + "loss": 0.9444, + "mean_token_accuracy": 0.7256955981254578, + "num_tokens": 208234024.0, + "step": 86650 + }, + { + "epoch": 0.7945356193270376, + "learning_rate": 4.109470981938205e-05, + "loss": 0.9552, + "mean_token_accuracy": 0.721126115322113, + "num_tokens": 208265638.0, + "step": 86660 + }, + { + "epoch": 0.7946273035665169, + "learning_rate": 4.1076372971486206e-05, + "loss": 0.9349, + "mean_token_accuracy": 0.7214091718196869, + "num_tokens": 208295256.0, + "step": 86670 + }, + { + "epoch": 0.7947189878059961, + "learning_rate": 4.105803612359035e-05, + "loss": 0.9303, + "mean_token_accuracy": 0.7256463825702667, + "num_tokens": 208324026.0, + "step": 86680 + }, + { + "epoch": 0.7948106720454754, + "learning_rate": 4.103969927569451e-05, + "loss": 0.9361, + "mean_token_accuracy": 0.7245767474174499, + "num_tokens": 208354238.0, + "step": 86690 + }, + { + "epoch": 0.7949023562849546, + "learning_rate": 4.102136242779867e-05, + "loss": 1.0113, + "mean_token_accuracy": 0.7028233170509338, + "num_tokens": 208387109.0, + "step": 86700 + }, + { + "epoch": 0.7949940405244339, + "learning_rate": 4.1003025579902813e-05, + "loss": 0.9399, + "mean_token_accuracy": 0.7222343683242798, + "num_tokens": 208419858.0, + "step": 86710 + }, + { + "epoch": 0.795085724763913, + "learning_rate": 4.098468873200697e-05, + "loss": 0.9351, + "mean_token_accuracy": 0.7292609870433807, + "num_tokens": 208450896.0, + "step": 86720 + }, + { + "epoch": 0.7951774090033923, + "learning_rate": 4.0966351884111124e-05, + "loss": 0.9541, + "mean_token_accuracy": 0.7215969681739807, + "num_tokens": 208481716.0, + "step": 86730 + }, + { + "epoch": 0.7952690932428715, + "learning_rate": 4.0948015036215276e-05, + "loss": 0.9366, + "mean_token_accuracy": 0.7248545944690704, + "num_tokens": 208511158.0, + "step": 86740 + }, + { + "epoch": 0.7953607774823508, + "learning_rate": 4.0929678188319434e-05, + "loss": 0.9853, + "mean_token_accuracy": 0.7170604169368744, + "num_tokens": 208542521.0, + "step": 86750 + }, + { + "epoch": 0.79545246172183, + "learning_rate": 4.091134134042358e-05, + "loss": 0.9998, + "mean_token_accuracy": 0.7087662935256958, + "num_tokens": 208574677.0, + "step": 86760 + }, + { + "epoch": 0.7955441459613093, + "learning_rate": 4.089300449252774e-05, + "loss": 0.945, + "mean_token_accuracy": 0.7175221562385559, + "num_tokens": 208606521.0, + "step": 86770 + }, + { + "epoch": 0.7956358302007884, + "learning_rate": 4.087466764463189e-05, + "loss": 0.9327, + "mean_token_accuracy": 0.7264738619327545, + "num_tokens": 208637324.0, + "step": 86780 + }, + { + "epoch": 0.7957275144402677, + "learning_rate": 4.085633079673604e-05, + "loss": 0.9405, + "mean_token_accuracy": 0.7284891366958618, + "num_tokens": 208667218.0, + "step": 86790 + }, + { + "epoch": 0.7958191986797469, + "learning_rate": 4.08379939488402e-05, + "loss": 0.9122, + "mean_token_accuracy": 0.7302503824234009, + "num_tokens": 208695456.0, + "step": 86800 + }, + { + "epoch": 0.7959108829192262, + "learning_rate": 4.0819657100944346e-05, + "loss": 0.964, + "mean_token_accuracy": 0.7192913830280304, + "num_tokens": 208727231.0, + "step": 86810 + }, + { + "epoch": 0.7960025671587054, + "learning_rate": 4.0801320253048504e-05, + "loss": 1.0259, + "mean_token_accuracy": 0.6997593402862549, + "num_tokens": 208759898.0, + "step": 86820 + }, + { + "epoch": 0.7960942513981847, + "learning_rate": 4.0782983405152656e-05, + "loss": 0.9517, + "mean_token_accuracy": 0.7208040475845336, + "num_tokens": 208790664.0, + "step": 86830 + }, + { + "epoch": 0.7961859356376639, + "learning_rate": 4.076464655725681e-05, + "loss": 0.9211, + "mean_token_accuracy": 0.7288584172725677, + "num_tokens": 208821993.0, + "step": 86840 + }, + { + "epoch": 0.7962776198771431, + "learning_rate": 4.074630970936097e-05, + "loss": 0.9069, + "mean_token_accuracy": 0.7319348752498627, + "num_tokens": 208853251.0, + "step": 86850 + }, + { + "epoch": 0.7963693041166223, + "learning_rate": 4.072797286146511e-05, + "loss": 0.9621, + "mean_token_accuracy": 0.7171362936496735, + "num_tokens": 208884437.0, + "step": 86860 + }, + { + "epoch": 0.7964609883561016, + "learning_rate": 4.070963601356927e-05, + "loss": 0.9581, + "mean_token_accuracy": 0.7199141204357147, + "num_tokens": 208915128.0, + "step": 86870 + }, + { + "epoch": 0.7965526725955808, + "learning_rate": 4.069129916567342e-05, + "loss": 1.0149, + "mean_token_accuracy": 0.7024094223976135, + "num_tokens": 208947548.0, + "step": 86880 + }, + { + "epoch": 0.7966443568350601, + "learning_rate": 4.0672962317777574e-05, + "loss": 0.9352, + "mean_token_accuracy": 0.723261296749115, + "num_tokens": 208979031.0, + "step": 86890 + }, + { + "epoch": 0.7967360410745393, + "learning_rate": 4.065462546988173e-05, + "loss": 0.9509, + "mean_token_accuracy": 0.7243140757083892, + "num_tokens": 209009123.0, + "step": 86900 + }, + { + "epoch": 0.7968277253140186, + "learning_rate": 4.0636288621985885e-05, + "loss": 0.963, + "mean_token_accuracy": 0.72268648147583, + "num_tokens": 209039210.0, + "step": 86910 + }, + { + "epoch": 0.7969194095534977, + "learning_rate": 4.0617951774090037e-05, + "loss": 0.9351, + "mean_token_accuracy": 0.7223830938339233, + "num_tokens": 209069237.0, + "step": 86920 + }, + { + "epoch": 0.797011093792977, + "learning_rate": 4.059961492619419e-05, + "loss": 0.9747, + "mean_token_accuracy": 0.7122148394584655, + "num_tokens": 209100369.0, + "step": 86930 + }, + { + "epoch": 0.7971027780324562, + "learning_rate": 4.058127807829834e-05, + "loss": 0.9923, + "mean_token_accuracy": 0.7069045722484588, + "num_tokens": 209133037.0, + "step": 86940 + }, + { + "epoch": 0.7971944622719355, + "learning_rate": 4.05629412304025e-05, + "loss": 0.902, + "mean_token_accuracy": 0.7337145149707794, + "num_tokens": 209165006.0, + "step": 86950 + }, + { + "epoch": 0.7972861465114147, + "learning_rate": 4.054460438250665e-05, + "loss": 0.9339, + "mean_token_accuracy": 0.7205852448940278, + "num_tokens": 209196496.0, + "step": 86960 + }, + { + "epoch": 0.797377830750894, + "learning_rate": 4.05262675346108e-05, + "loss": 0.9287, + "mean_token_accuracy": 0.7206258594989776, + "num_tokens": 209226131.0, + "step": 86970 + }, + { + "epoch": 0.7974695149903731, + "learning_rate": 4.0507930686714955e-05, + "loss": 0.9249, + "mean_token_accuracy": 0.7250255346298218, + "num_tokens": 209255177.0, + "step": 86980 + }, + { + "epoch": 0.7975611992298524, + "learning_rate": 4.0489593838819106e-05, + "loss": 0.9618, + "mean_token_accuracy": 0.7173052787780761, + "num_tokens": 209285005.0, + "step": 86990 + }, + { + "epoch": 0.7976528834693316, + "learning_rate": 4.0471256990923265e-05, + "loss": 1.0192, + "mean_token_accuracy": 0.7025117516517639, + "num_tokens": 209316683.0, + "step": 87000 + }, + { + "epoch": 0.7977445677088109, + "learning_rate": 4.045292014302742e-05, + "loss": 0.9388, + "mean_token_accuracy": 0.7230490922927857, + "num_tokens": 209348067.0, + "step": 87010 + }, + { + "epoch": 0.7978362519482901, + "learning_rate": 4.043458329513157e-05, + "loss": 0.9596, + "mean_token_accuracy": 0.7197664737701416, + "num_tokens": 209380138.0, + "step": 87020 + }, + { + "epoch": 0.7979279361877694, + "learning_rate": 4.041624644723572e-05, + "loss": 0.9374, + "mean_token_accuracy": 0.7165299355983734, + "num_tokens": 209410731.0, + "step": 87030 + }, + { + "epoch": 0.7980196204272486, + "learning_rate": 4.039790959933988e-05, + "loss": 0.9274, + "mean_token_accuracy": 0.7212114334106445, + "num_tokens": 209440554.0, + "step": 87040 + }, + { + "epoch": 0.7981113046667277, + "learning_rate": 4.037957275144403e-05, + "loss": 0.9596, + "mean_token_accuracy": 0.7149106860160828, + "num_tokens": 209470542.0, + "step": 87050 + }, + { + "epoch": 0.798202988906207, + "learning_rate": 4.036123590354818e-05, + "loss": 1.0066, + "mean_token_accuracy": 0.7041074275970459, + "num_tokens": 209502895.0, + "step": 87060 + }, + { + "epoch": 0.7982946731456863, + "learning_rate": 4.0342899055652335e-05, + "loss": 0.9236, + "mean_token_accuracy": 0.7260433256626129, + "num_tokens": 209534663.0, + "step": 87070 + }, + { + "epoch": 0.7983863573851655, + "learning_rate": 4.032456220775649e-05, + "loss": 0.9451, + "mean_token_accuracy": 0.7250676095485687, + "num_tokens": 209565168.0, + "step": 87080 + }, + { + "epoch": 0.7984780416246448, + "learning_rate": 4.0306225359860645e-05, + "loss": 0.9323, + "mean_token_accuracy": 0.7251429498195648, + "num_tokens": 209595188.0, + "step": 87090 + }, + { + "epoch": 0.798569725864124, + "learning_rate": 4.02878885119648e-05, + "loss": 0.9534, + "mean_token_accuracy": 0.7167445003986359, + "num_tokens": 209626060.0, + "step": 87100 + }, + { + "epoch": 0.7986614101036031, + "learning_rate": 4.026955166406895e-05, + "loss": 0.9482, + "mean_token_accuracy": 0.7180288314819336, + "num_tokens": 209657260.0, + "step": 87110 + }, + { + "epoch": 0.7987530943430824, + "learning_rate": 4.02512148161731e-05, + "loss": 0.9954, + "mean_token_accuracy": 0.708745276927948, + "num_tokens": 209689358.0, + "step": 87120 + }, + { + "epoch": 0.7988447785825616, + "learning_rate": 4.023287796827725e-05, + "loss": 0.916, + "mean_token_accuracy": 0.7291933119297027, + "num_tokens": 209720348.0, + "step": 87130 + }, + { + "epoch": 0.7989364628220409, + "learning_rate": 4.021454112038141e-05, + "loss": 0.9235, + "mean_token_accuracy": 0.7270193874835968, + "num_tokens": 209749593.0, + "step": 87140 + }, + { + "epoch": 0.7990281470615201, + "learning_rate": 4.019620427248556e-05, + "loss": 0.9296, + "mean_token_accuracy": 0.7201617002487183, + "num_tokens": 209782138.0, + "step": 87150 + }, + { + "epoch": 0.7991198313009994, + "learning_rate": 4.0177867424589715e-05, + "loss": 0.8967, + "mean_token_accuracy": 0.7318171620368957, + "num_tokens": 209811050.0, + "step": 87160 + }, + { + "epoch": 0.7992115155404786, + "learning_rate": 4.015953057669387e-05, + "loss": 0.9692, + "mean_token_accuracy": 0.7147955060005188, + "num_tokens": 209842641.0, + "step": 87170 + }, + { + "epoch": 0.7993031997799578, + "learning_rate": 4.014119372879802e-05, + "loss": 1.0144, + "mean_token_accuracy": 0.7072067379951477, + "num_tokens": 209875507.0, + "step": 87180 + }, + { + "epoch": 0.799394884019437, + "learning_rate": 4.012285688090218e-05, + "loss": 0.9469, + "mean_token_accuracy": 0.7181179940700531, + "num_tokens": 209907302.0, + "step": 87190 + }, + { + "epoch": 0.7994865682589163, + "learning_rate": 4.010452003300633e-05, + "loss": 0.9515, + "mean_token_accuracy": 0.7170276045799255, + "num_tokens": 209938370.0, + "step": 87200 + }, + { + "epoch": 0.7995782524983955, + "learning_rate": 4.008618318511048e-05, + "loss": 0.9073, + "mean_token_accuracy": 0.7291929602622986, + "num_tokens": 209967429.0, + "step": 87210 + }, + { + "epoch": 0.7996699367378748, + "learning_rate": 4.006784633721464e-05, + "loss": 0.9496, + "mean_token_accuracy": 0.7195300698280335, + "num_tokens": 209996925.0, + "step": 87220 + }, + { + "epoch": 0.799761620977354, + "learning_rate": 4.0049509489318785e-05, + "loss": 0.9654, + "mean_token_accuracy": 0.7161861419677734, + "num_tokens": 210028490.0, + "step": 87230 + }, + { + "epoch": 0.7998533052168332, + "learning_rate": 4.0031172641422944e-05, + "loss": 1.0231, + "mean_token_accuracy": 0.6989761531352997, + "num_tokens": 210060393.0, + "step": 87240 + }, + { + "epoch": 0.7999449894563124, + "learning_rate": 4.0012835793527096e-05, + "loss": 0.9493, + "mean_token_accuracy": 0.7177074491977692, + "num_tokens": 210091680.0, + "step": 87250 + }, + { + "epoch": 0.8000366736957917, + "learning_rate": 3.999449894563125e-05, + "loss": 0.9206, + "mean_token_accuracy": 0.7272840738296509, + "num_tokens": 210123428.0, + "step": 87260 + }, + { + "epoch": 0.8001283579352709, + "learning_rate": 3.9976162097735406e-05, + "loss": 0.9429, + "mean_token_accuracy": 0.7239596605300903, + "num_tokens": 210153951.0, + "step": 87270 + }, + { + "epoch": 0.8002200421747502, + "learning_rate": 3.995782524983955e-05, + "loss": 0.9122, + "mean_token_accuracy": 0.7328599035739899, + "num_tokens": 210183418.0, + "step": 87280 + }, + { + "epoch": 0.8003117264142294, + "learning_rate": 3.993948840194371e-05, + "loss": 0.9814, + "mean_token_accuracy": 0.7061148047447204, + "num_tokens": 210212876.0, + "step": 87290 + }, + { + "epoch": 0.8004034106537087, + "learning_rate": 3.992115155404786e-05, + "loss": 0.9947, + "mean_token_accuracy": 0.7061928927898407, + "num_tokens": 210244168.0, + "step": 87300 + }, + { + "epoch": 0.8004950948931878, + "learning_rate": 3.9902814706152014e-05, + "loss": 0.9538, + "mean_token_accuracy": 0.7256619215011597, + "num_tokens": 210275609.0, + "step": 87310 + }, + { + "epoch": 0.8005867791326671, + "learning_rate": 3.988447785825617e-05, + "loss": 0.9519, + "mean_token_accuracy": 0.7208737552165985, + "num_tokens": 210306174.0, + "step": 87320 + }, + { + "epoch": 0.8006784633721463, + "learning_rate": 3.986614101036032e-05, + "loss": 0.9393, + "mean_token_accuracy": 0.7272839725017548, + "num_tokens": 210337464.0, + "step": 87330 + }, + { + "epoch": 0.8007701476116256, + "learning_rate": 3.9847804162464476e-05, + "loss": 0.9365, + "mean_token_accuracy": 0.7243816077709198, + "num_tokens": 210365979.0, + "step": 87340 + }, + { + "epoch": 0.8008618318511048, + "learning_rate": 3.982946731456863e-05, + "loss": 0.9699, + "mean_token_accuracy": 0.7135676264762878, + "num_tokens": 210396758.0, + "step": 87350 + }, + { + "epoch": 0.8009535160905841, + "learning_rate": 3.981113046667278e-05, + "loss": 1.0267, + "mean_token_accuracy": 0.6961562693119049, + "num_tokens": 210428116.0, + "step": 87360 + }, + { + "epoch": 0.8010452003300632, + "learning_rate": 3.979279361877694e-05, + "loss": 0.9412, + "mean_token_accuracy": 0.7198286354541779, + "num_tokens": 210459124.0, + "step": 87370 + }, + { + "epoch": 0.8011368845695425, + "learning_rate": 3.9774456770881083e-05, + "loss": 0.9239, + "mean_token_accuracy": 0.7228979408740998, + "num_tokens": 210489292.0, + "step": 87380 + }, + { + "epoch": 0.8012285688090217, + "learning_rate": 3.975611992298524e-05, + "loss": 0.9269, + "mean_token_accuracy": 0.7259806156158447, + "num_tokens": 210518533.0, + "step": 87390 + }, + { + "epoch": 0.801320253048501, + "learning_rate": 3.9737783075089394e-05, + "loss": 0.948, + "mean_token_accuracy": 0.7187861204147339, + "num_tokens": 210548130.0, + "step": 87400 + }, + { + "epoch": 0.8014119372879802, + "learning_rate": 3.9719446227193546e-05, + "loss": 0.976, + "mean_token_accuracy": 0.7104677975177764, + "num_tokens": 210578522.0, + "step": 87410 + }, + { + "epoch": 0.8015036215274595, + "learning_rate": 3.9701109379297704e-05, + "loss": 1.0142, + "mean_token_accuracy": 0.7038933455944061, + "num_tokens": 210610676.0, + "step": 87420 + }, + { + "epoch": 0.8015953057669387, + "learning_rate": 3.968277253140185e-05, + "loss": 0.9731, + "mean_token_accuracy": 0.7116360366344452, + "num_tokens": 210641489.0, + "step": 87430 + }, + { + "epoch": 0.8016869900064179, + "learning_rate": 3.966443568350601e-05, + "loss": 0.9531, + "mean_token_accuracy": 0.7212050378322601, + "num_tokens": 210672789.0, + "step": 87440 + }, + { + "epoch": 0.8017786742458971, + "learning_rate": 3.964609883561016e-05, + "loss": 0.9566, + "mean_token_accuracy": 0.7202536642551423, + "num_tokens": 210702757.0, + "step": 87450 + }, + { + "epoch": 0.8018703584853764, + "learning_rate": 3.962776198771431e-05, + "loss": 0.9312, + "mean_token_accuracy": 0.7226182639598846, + "num_tokens": 210733530.0, + "step": 87460 + }, + { + "epoch": 0.8019620427248556, + "learning_rate": 3.960942513981847e-05, + "loss": 0.9909, + "mean_token_accuracy": 0.7056439638137817, + "num_tokens": 210764589.0, + "step": 87470 + }, + { + "epoch": 0.8020537269643349, + "learning_rate": 3.9591088291922616e-05, + "loss": 0.9983, + "mean_token_accuracy": 0.707426768541336, + "num_tokens": 210796035.0, + "step": 87480 + }, + { + "epoch": 0.8021454112038141, + "learning_rate": 3.9572751444026774e-05, + "loss": 0.9138, + "mean_token_accuracy": 0.7283466637134552, + "num_tokens": 210827490.0, + "step": 87490 + }, + { + "epoch": 0.8022370954432932, + "learning_rate": 3.9554414596130926e-05, + "loss": 0.9406, + "mean_token_accuracy": 0.7218400359153747, + "num_tokens": 210859404.0, + "step": 87500 + }, + { + "epoch": 0.8023287796827725, + "learning_rate": 3.953607774823508e-05, + "loss": 0.9397, + "mean_token_accuracy": 0.7297419905662537, + "num_tokens": 210888658.0, + "step": 87510 + }, + { + "epoch": 0.8024204639222517, + "learning_rate": 3.951774090033924e-05, + "loss": 0.9209, + "mean_token_accuracy": 0.72423837184906, + "num_tokens": 210919037.0, + "step": 87520 + }, + { + "epoch": 0.802512148161731, + "learning_rate": 3.949940405244339e-05, + "loss": 0.9985, + "mean_token_accuracy": 0.7135941743850708, + "num_tokens": 210949611.0, + "step": 87530 + }, + { + "epoch": 0.8026038324012102, + "learning_rate": 3.948106720454754e-05, + "loss": 1.0144, + "mean_token_accuracy": 0.7023302793502808, + "num_tokens": 210981073.0, + "step": 87540 + }, + { + "epoch": 0.8026955166406895, + "learning_rate": 3.946273035665169e-05, + "loss": 0.9583, + "mean_token_accuracy": 0.7169875621795654, + "num_tokens": 211012249.0, + "step": 87550 + }, + { + "epoch": 0.8027872008801687, + "learning_rate": 3.9444393508755844e-05, + "loss": 0.9546, + "mean_token_accuracy": 0.7173968315124511, + "num_tokens": 211042131.0, + "step": 87560 + }, + { + "epoch": 0.8028788851196479, + "learning_rate": 3.942605666086e-05, + "loss": 0.965, + "mean_token_accuracy": 0.7187240719795227, + "num_tokens": 211072035.0, + "step": 87570 + }, + { + "epoch": 0.8029705693591271, + "learning_rate": 3.9407719812964155e-05, + "loss": 0.954, + "mean_token_accuracy": 0.7188745498657226, + "num_tokens": 211102200.0, + "step": 87580 + }, + { + "epoch": 0.8030622535986064, + "learning_rate": 3.9389382965068307e-05, + "loss": 1.0042, + "mean_token_accuracy": 0.7035655081272125, + "num_tokens": 211132455.0, + "step": 87590 + }, + { + "epoch": 0.8031539378380856, + "learning_rate": 3.937104611717246e-05, + "loss": 1.0106, + "mean_token_accuracy": 0.7055139124393464, + "num_tokens": 211164525.0, + "step": 87600 + }, + { + "epoch": 0.8032456220775649, + "learning_rate": 3.935270926927661e-05, + "loss": 0.919, + "mean_token_accuracy": 0.7271938025951385, + "num_tokens": 211194734.0, + "step": 87610 + }, + { + "epoch": 0.8033373063170441, + "learning_rate": 3.933437242138077e-05, + "loss": 0.9212, + "mean_token_accuracy": 0.7250953376293182, + "num_tokens": 211225827.0, + "step": 87620 + }, + { + "epoch": 0.8034289905565233, + "learning_rate": 3.931603557348492e-05, + "loss": 0.9497, + "mean_token_accuracy": 0.719471538066864, + "num_tokens": 211255154.0, + "step": 87630 + }, + { + "epoch": 0.8035206747960025, + "learning_rate": 3.929769872558907e-05, + "loss": 0.9396, + "mean_token_accuracy": 0.7259688198566436, + "num_tokens": 211284628.0, + "step": 87640 + }, + { + "epoch": 0.8036123590354818, + "learning_rate": 3.9279361877693225e-05, + "loss": 0.9453, + "mean_token_accuracy": 0.7172414362430573, + "num_tokens": 211315715.0, + "step": 87650 + }, + { + "epoch": 0.803704043274961, + "learning_rate": 3.9261025029797376e-05, + "loss": 1.0265, + "mean_token_accuracy": 0.696022343635559, + "num_tokens": 211346988.0, + "step": 87660 + }, + { + "epoch": 0.8037957275144403, + "learning_rate": 3.9242688181901535e-05, + "loss": 0.9324, + "mean_token_accuracy": 0.7222636938095093, + "num_tokens": 211378233.0, + "step": 87670 + }, + { + "epoch": 0.8038874117539195, + "learning_rate": 3.922435133400569e-05, + "loss": 0.9872, + "mean_token_accuracy": 0.7116622984409332, + "num_tokens": 211408954.0, + "step": 87680 + }, + { + "epoch": 0.8039790959933988, + "learning_rate": 3.920601448610984e-05, + "loss": 0.9102, + "mean_token_accuracy": 0.7304248034954071, + "num_tokens": 211437232.0, + "step": 87690 + }, + { + "epoch": 0.8040707802328779, + "learning_rate": 3.918767763821399e-05, + "loss": 0.9743, + "mean_token_accuracy": 0.7167141556739807, + "num_tokens": 211469487.0, + "step": 87700 + }, + { + "epoch": 0.8041624644723572, + "learning_rate": 3.916934079031815e-05, + "loss": 1.0197, + "mean_token_accuracy": 0.7021766901016235, + "num_tokens": 211499026.0, + "step": 87710 + }, + { + "epoch": 0.8042541487118364, + "learning_rate": 3.91510039424223e-05, + "loss": 1.0043, + "mean_token_accuracy": 0.7064680993556977, + "num_tokens": 211531472.0, + "step": 87720 + }, + { + "epoch": 0.8043458329513157, + "learning_rate": 3.913266709452645e-05, + "loss": 0.9211, + "mean_token_accuracy": 0.7292511284351348, + "num_tokens": 211562880.0, + "step": 87730 + }, + { + "epoch": 0.8044375171907949, + "learning_rate": 3.9114330246630605e-05, + "loss": 0.9782, + "mean_token_accuracy": 0.7146872460842133, + "num_tokens": 211594193.0, + "step": 87740 + }, + { + "epoch": 0.8045292014302742, + "learning_rate": 3.909599339873476e-05, + "loss": 0.918, + "mean_token_accuracy": 0.7276806056499481, + "num_tokens": 211624063.0, + "step": 87750 + }, + { + "epoch": 0.8046208856697533, + "learning_rate": 3.9077656550838915e-05, + "loss": 0.994, + "mean_token_accuracy": 0.7086891889572143, + "num_tokens": 211655049.0, + "step": 87760 + }, + { + "epoch": 0.8047125699092326, + "learning_rate": 3.905931970294307e-05, + "loss": 1.0015, + "mean_token_accuracy": 0.7083421170711517, + "num_tokens": 211685571.0, + "step": 87770 + }, + { + "epoch": 0.8048042541487118, + "learning_rate": 3.904098285504722e-05, + "loss": 1.0112, + "mean_token_accuracy": 0.704827344417572, + "num_tokens": 211717536.0, + "step": 87780 + }, + { + "epoch": 0.8048959383881911, + "learning_rate": 3.902264600715137e-05, + "loss": 0.988, + "mean_token_accuracy": 0.7118992805480957, + "num_tokens": 211748833.0, + "step": 87790 + }, + { + "epoch": 0.8049876226276703, + "learning_rate": 3.900430915925552e-05, + "loss": 0.9308, + "mean_token_accuracy": 0.723883455991745, + "num_tokens": 211779141.0, + "step": 87800 + }, + { + "epoch": 0.8050793068671496, + "learning_rate": 3.898597231135968e-05, + "loss": 0.8952, + "mean_token_accuracy": 0.7299412369728089, + "num_tokens": 211809033.0, + "step": 87810 + }, + { + "epoch": 0.8051709911066288, + "learning_rate": 3.896763546346383e-05, + "loss": 0.9067, + "mean_token_accuracy": 0.7267274975776672, + "num_tokens": 211837328.0, + "step": 87820 + }, + { + "epoch": 0.805262675346108, + "learning_rate": 3.8949298615567985e-05, + "loss": 0.9796, + "mean_token_accuracy": 0.7142065763473511, + "num_tokens": 211869504.0, + "step": 87830 + }, + { + "epoch": 0.8053543595855872, + "learning_rate": 3.8930961767672144e-05, + "loss": 0.9873, + "mean_token_accuracy": 0.7059406995773315, + "num_tokens": 211900504.0, + "step": 87840 + }, + { + "epoch": 0.8054460438250665, + "learning_rate": 3.891262491977629e-05, + "loss": 1.0178, + "mean_token_accuracy": 0.6987842381000519, + "num_tokens": 211932474.0, + "step": 87850 + }, + { + "epoch": 0.8055377280645457, + "learning_rate": 3.889428807188045e-05, + "loss": 0.9856, + "mean_token_accuracy": 0.7069795370101929, + "num_tokens": 211962924.0, + "step": 87860 + }, + { + "epoch": 0.805629412304025, + "learning_rate": 3.88759512239846e-05, + "loss": 1.0099, + "mean_token_accuracy": 0.7000271320343018, + "num_tokens": 211993217.0, + "step": 87870 + }, + { + "epoch": 0.8057210965435042, + "learning_rate": 3.885761437608875e-05, + "loss": 0.915, + "mean_token_accuracy": 0.7269558608531952, + "num_tokens": 212021789.0, + "step": 87880 + }, + { + "epoch": 0.8058127807829834, + "learning_rate": 3.883927752819291e-05, + "loss": 0.9503, + "mean_token_accuracy": 0.7160397291183471, + "num_tokens": 212052730.0, + "step": 87890 + }, + { + "epoch": 0.8059044650224626, + "learning_rate": 3.8820940680297055e-05, + "loss": 0.9924, + "mean_token_accuracy": 0.7088140308856964, + "num_tokens": 212084561.0, + "step": 87900 + }, + { + "epoch": 0.8059961492619419, + "learning_rate": 3.8802603832401214e-05, + "loss": 0.9428, + "mean_token_accuracy": 0.7223440527915954, + "num_tokens": 212115883.0, + "step": 87910 + }, + { + "epoch": 0.8060878335014211, + "learning_rate": 3.8784266984505366e-05, + "loss": 0.9776, + "mean_token_accuracy": 0.7104128360748291, + "num_tokens": 212147656.0, + "step": 87920 + }, + { + "epoch": 0.8061795177409004, + "learning_rate": 3.876593013660952e-05, + "loss": 0.992, + "mean_token_accuracy": 0.7046168982982636, + "num_tokens": 212177902.0, + "step": 87930 + }, + { + "epoch": 0.8062712019803796, + "learning_rate": 3.8747593288713676e-05, + "loss": 0.9981, + "mean_token_accuracy": 0.7021388173103332, + "num_tokens": 212208062.0, + "step": 87940 + }, + { + "epoch": 0.8063628862198589, + "learning_rate": 3.872925644081782e-05, + "loss": 0.9651, + "mean_token_accuracy": 0.7151989221572876, + "num_tokens": 212236622.0, + "step": 87950 + }, + { + "epoch": 0.806454570459338, + "learning_rate": 3.871091959292198e-05, + "loss": 1.0139, + "mean_token_accuracy": 0.702283525466919, + "num_tokens": 212267305.0, + "step": 87960 + }, + { + "epoch": 0.8065462546988172, + "learning_rate": 3.869258274502613e-05, + "loss": 0.9738, + "mean_token_accuracy": 0.7131257295608521, + "num_tokens": 212298509.0, + "step": 87970 + }, + { + "epoch": 0.8066379389382965, + "learning_rate": 3.8674245897130284e-05, + "loss": 0.9946, + "mean_token_accuracy": 0.7092668652534485, + "num_tokens": 212329561.0, + "step": 87980 + }, + { + "epoch": 0.8067296231777757, + "learning_rate": 3.865590904923444e-05, + "loss": 0.9438, + "mean_token_accuracy": 0.7176726818084717, + "num_tokens": 212359206.0, + "step": 87990 + }, + { + "epoch": 0.806821307417255, + "learning_rate": 3.863757220133859e-05, + "loss": 1.015, + "mean_token_accuracy": 0.7055783033370971, + "num_tokens": 212390480.0, + "step": 88000 + }, + { + "epoch": 0.8069129916567342, + "learning_rate": 3.8619235353442746e-05, + "loss": 0.9686, + "mean_token_accuracy": 0.7132801949977875, + "num_tokens": 212421124.0, + "step": 88010 + }, + { + "epoch": 0.8070046758962134, + "learning_rate": 3.86008985055469e-05, + "loss": 1.0125, + "mean_token_accuracy": 0.6998761415481567, + "num_tokens": 212451158.0, + "step": 88020 + }, + { + "epoch": 0.8070963601356926, + "learning_rate": 3.858256165765105e-05, + "loss": 0.9471, + "mean_token_accuracy": 0.7199070811271667, + "num_tokens": 212480837.0, + "step": 88030 + }, + { + "epoch": 0.8071880443751719, + "learning_rate": 3.856422480975521e-05, + "loss": 1.0048, + "mean_token_accuracy": 0.707367992401123, + "num_tokens": 212511966.0, + "step": 88040 + }, + { + "epoch": 0.8072797286146511, + "learning_rate": 3.8545887961859353e-05, + "loss": 0.9472, + "mean_token_accuracy": 0.7156034588813782, + "num_tokens": 212541582.0, + "step": 88050 + }, + { + "epoch": 0.8073714128541304, + "learning_rate": 3.852755111396351e-05, + "loss": 1.0048, + "mean_token_accuracy": 0.7002568304538727, + "num_tokens": 212572851.0, + "step": 88060 + }, + { + "epoch": 0.8074630970936096, + "learning_rate": 3.8509214266067664e-05, + "loss": 0.9805, + "mean_token_accuracy": 0.711814159154892, + "num_tokens": 212601763.0, + "step": 88070 + }, + { + "epoch": 0.8075547813330889, + "learning_rate": 3.8490877418171816e-05, + "loss": 1.0326, + "mean_token_accuracy": 0.6988707661628724, + "num_tokens": 212633133.0, + "step": 88080 + }, + { + "epoch": 0.807646465572568, + "learning_rate": 3.8472540570275974e-05, + "loss": 1.012, + "mean_token_accuracy": 0.7042496144771576, + "num_tokens": 212665040.0, + "step": 88090 + }, + { + "epoch": 0.8077381498120473, + "learning_rate": 3.845420372238012e-05, + "loss": 0.9293, + "mean_token_accuracy": 0.7194316208362579, + "num_tokens": 212694268.0, + "step": 88100 + }, + { + "epoch": 0.8078298340515265, + "learning_rate": 3.843586687448428e-05, + "loss": 1.0078, + "mean_token_accuracy": 0.7069931268692017, + "num_tokens": 212725343.0, + "step": 88110 + }, + { + "epoch": 0.8079215182910058, + "learning_rate": 3.841753002658843e-05, + "loss": 0.9689, + "mean_token_accuracy": 0.708724421262741, + "num_tokens": 212757430.0, + "step": 88120 + }, + { + "epoch": 0.808013202530485, + "learning_rate": 3.839919317869258e-05, + "loss": 1.0366, + "mean_token_accuracy": 0.6936649978160858, + "num_tokens": 212785740.0, + "step": 88130 + }, + { + "epoch": 0.8081048867699643, + "learning_rate": 3.838085633079674e-05, + "loss": 1.0409, + "mean_token_accuracy": 0.6952789068222046, + "num_tokens": 212815872.0, + "step": 88140 + }, + { + "epoch": 0.8081965710094435, + "learning_rate": 3.836251948290089e-05, + "loss": 1.0242, + "mean_token_accuracy": 0.7023537755012512, + "num_tokens": 212847005.0, + "step": 88150 + }, + { + "epoch": 0.8082882552489227, + "learning_rate": 3.8344182635005044e-05, + "loss": 1.0176, + "mean_token_accuracy": 0.7029186666011811, + "num_tokens": 212879746.0, + "step": 88160 + }, + { + "epoch": 0.8083799394884019, + "learning_rate": 3.8325845787109196e-05, + "loss": 1.0404, + "mean_token_accuracy": 0.7016336560249329, + "num_tokens": 212910525.0, + "step": 88170 + }, + { + "epoch": 0.8084716237278812, + "learning_rate": 3.830750893921335e-05, + "loss": 0.9744, + "mean_token_accuracy": 0.7135962665081024, + "num_tokens": 212940403.0, + "step": 88180 + }, + { + "epoch": 0.8085633079673604, + "learning_rate": 3.828917209131751e-05, + "loss": 0.9793, + "mean_token_accuracy": 0.710008054971695, + "num_tokens": 212971219.0, + "step": 88190 + }, + { + "epoch": 0.8086549922068397, + "learning_rate": 3.827083524342166e-05, + "loss": 1.0374, + "mean_token_accuracy": 0.693979698419571, + "num_tokens": 213001472.0, + "step": 88200 + }, + { + "epoch": 0.8087466764463189, + "learning_rate": 3.825249839552581e-05, + "loss": 1.0347, + "mean_token_accuracy": 0.6930490970611572, + "num_tokens": 213032740.0, + "step": 88210 + }, + { + "epoch": 0.8088383606857981, + "learning_rate": 3.823416154762996e-05, + "loss": 0.9726, + "mean_token_accuracy": 0.7108381807804107, + "num_tokens": 213064307.0, + "step": 88220 + }, + { + "epoch": 0.8089300449252773, + "learning_rate": 3.8215824699734114e-05, + "loss": 1.0181, + "mean_token_accuracy": 0.7040467023849487, + "num_tokens": 213095133.0, + "step": 88230 + }, + { + "epoch": 0.8090217291647566, + "learning_rate": 3.819748785183827e-05, + "loss": 0.99, + "mean_token_accuracy": 0.7062864422798156, + "num_tokens": 213125845.0, + "step": 88240 + }, + { + "epoch": 0.8091134134042358, + "learning_rate": 3.8179151003942425e-05, + "loss": 1.0044, + "mean_token_accuracy": 0.7024176120758057, + "num_tokens": 213155881.0, + "step": 88250 + }, + { + "epoch": 0.8092050976437151, + "learning_rate": 3.8160814156046577e-05, + "loss": 1.0466, + "mean_token_accuracy": 0.6926968991756439, + "num_tokens": 213187092.0, + "step": 88260 + }, + { + "epoch": 0.8092967818831943, + "learning_rate": 3.814247730815073e-05, + "loss": 1.0012, + "mean_token_accuracy": 0.7008063197135925, + "num_tokens": 213218664.0, + "step": 88270 + }, + { + "epoch": 0.8093884661226736, + "learning_rate": 3.812414046025488e-05, + "loss": 1.0249, + "mean_token_accuracy": 0.7034690320491791, + "num_tokens": 213250393.0, + "step": 88280 + }, + { + "epoch": 0.8094801503621527, + "learning_rate": 3.810580361235904e-05, + "loss": 0.9598, + "mean_token_accuracy": 0.7189905226230622, + "num_tokens": 213281184.0, + "step": 88290 + }, + { + "epoch": 0.809571834601632, + "learning_rate": 3.808746676446319e-05, + "loss": 0.9845, + "mean_token_accuracy": 0.7038617312908173, + "num_tokens": 213312259.0, + "step": 88300 + }, + { + "epoch": 0.8096635188411112, + "learning_rate": 3.806912991656734e-05, + "loss": 0.9706, + "mean_token_accuracy": 0.7138518333435059, + "num_tokens": 213341191.0, + "step": 88310 + }, + { + "epoch": 0.8097552030805905, + "learning_rate": 3.8050793068671495e-05, + "loss": 1.0368, + "mean_token_accuracy": 0.6929193556308746, + "num_tokens": 213372392.0, + "step": 88320 + }, + { + "epoch": 0.8098468873200697, + "learning_rate": 3.803245622077565e-05, + "loss": 0.9991, + "mean_token_accuracy": 0.7051734685897827, + "num_tokens": 213403814.0, + "step": 88330 + }, + { + "epoch": 0.809938571559549, + "learning_rate": 3.8014119372879805e-05, + "loss": 1.0016, + "mean_token_accuracy": 0.7056295692920684, + "num_tokens": 213436675.0, + "step": 88340 + }, + { + "epoch": 0.8100302557990281, + "learning_rate": 3.799578252498396e-05, + "loss": 0.9922, + "mean_token_accuracy": 0.710987263917923, + "num_tokens": 213466825.0, + "step": 88350 + }, + { + "epoch": 0.8101219400385073, + "learning_rate": 3.797744567708811e-05, + "loss": 0.9356, + "mean_token_accuracy": 0.7210259854793548, + "num_tokens": 213496287.0, + "step": 88360 + }, + { + "epoch": 0.8102136242779866, + "learning_rate": 3.795910882919226e-05, + "loss": 1.0192, + "mean_token_accuracy": 0.7016069829463959, + "num_tokens": 213528028.0, + "step": 88370 + }, + { + "epoch": 0.8103053085174658, + "learning_rate": 3.794077198129642e-05, + "loss": 1.0424, + "mean_token_accuracy": 0.6924838542938232, + "num_tokens": 213558841.0, + "step": 88380 + }, + { + "epoch": 0.8103969927569451, + "learning_rate": 3.792243513340057e-05, + "loss": 1.028, + "mean_token_accuracy": 0.6980836987495422, + "num_tokens": 213589731.0, + "step": 88390 + }, + { + "epoch": 0.8104886769964244, + "learning_rate": 3.790409828550472e-05, + "loss": 1.0422, + "mean_token_accuracy": 0.6992207884788513, + "num_tokens": 213622145.0, + "step": 88400 + }, + { + "epoch": 0.8105803612359036, + "learning_rate": 3.7885761437608875e-05, + "loss": 1.0096, + "mean_token_accuracy": 0.7027938604354859, + "num_tokens": 213653104.0, + "step": 88410 + }, + { + "epoch": 0.8106720454753827, + "learning_rate": 3.786742458971303e-05, + "loss": 0.9938, + "mean_token_accuracy": 0.7057611823081971, + "num_tokens": 213683900.0, + "step": 88420 + }, + { + "epoch": 0.810763729714862, + "learning_rate": 3.7849087741817185e-05, + "loss": 1.0263, + "mean_token_accuracy": 0.7007830560207366, + "num_tokens": 213713769.0, + "step": 88430 + }, + { + "epoch": 0.8108554139543412, + "learning_rate": 3.783075089392134e-05, + "loss": 1.0262, + "mean_token_accuracy": 0.6971380650997162, + "num_tokens": 213744230.0, + "step": 88440 + }, + { + "epoch": 0.8109470981938205, + "learning_rate": 3.781241404602549e-05, + "loss": 1.0232, + "mean_token_accuracy": 0.7045233488082886, + "num_tokens": 213776054.0, + "step": 88450 + }, + { + "epoch": 0.8110387824332997, + "learning_rate": 3.779407719812965e-05, + "loss": 1.026, + "mean_token_accuracy": 0.7000523269176483, + "num_tokens": 213807639.0, + "step": 88460 + }, + { + "epoch": 0.811130466672779, + "learning_rate": 3.777574035023379e-05, + "loss": 0.9708, + "mean_token_accuracy": 0.7135145664215088, + "num_tokens": 213838473.0, + "step": 88470 + }, + { + "epoch": 0.8112221509122581, + "learning_rate": 3.775740350233795e-05, + "loss": 1.0188, + "mean_token_accuracy": 0.70450279712677, + "num_tokens": 213869075.0, + "step": 88480 + }, + { + "epoch": 0.8113138351517374, + "learning_rate": 3.77390666544421e-05, + "loss": 1.0109, + "mean_token_accuracy": 0.7031781196594238, + "num_tokens": 213899235.0, + "step": 88490 + }, + { + "epoch": 0.8114055193912166, + "learning_rate": 3.7720729806546255e-05, + "loss": 1.0088, + "mean_token_accuracy": 0.699275553226471, + "num_tokens": 213930406.0, + "step": 88500 + }, + { + "epoch": 0.8114972036306959, + "learning_rate": 3.7702392958650414e-05, + "loss": 1.0298, + "mean_token_accuracy": 0.7035545229911804, + "num_tokens": 213961438.0, + "step": 88510 + }, + { + "epoch": 0.8115888878701751, + "learning_rate": 3.768405611075456e-05, + "loss": 1.0406, + "mean_token_accuracy": 0.7002984166145325, + "num_tokens": 213994024.0, + "step": 88520 + }, + { + "epoch": 0.8116805721096544, + "learning_rate": 3.766571926285872e-05, + "loss": 1.0164, + "mean_token_accuracy": 0.6988596498966217, + "num_tokens": 214025254.0, + "step": 88530 + }, + { + "epoch": 0.8117722563491336, + "learning_rate": 3.764738241496287e-05, + "loss": 0.9976, + "mean_token_accuracy": 0.7057909548282624, + "num_tokens": 214054777.0, + "step": 88540 + }, + { + "epoch": 0.8118639405886128, + "learning_rate": 3.762904556706702e-05, + "loss": 1.0154, + "mean_token_accuracy": 0.6962915360927582, + "num_tokens": 214085391.0, + "step": 88550 + }, + { + "epoch": 0.811955624828092, + "learning_rate": 3.761070871917118e-05, + "loss": 1.0146, + "mean_token_accuracy": 0.7051073789596558, + "num_tokens": 214115470.0, + "step": 88560 + }, + { + "epoch": 0.8120473090675713, + "learning_rate": 3.7592371871275325e-05, + "loss": 0.9843, + "mean_token_accuracy": 0.7093298554420471, + "num_tokens": 214147881.0, + "step": 88570 + }, + { + "epoch": 0.8121389933070505, + "learning_rate": 3.7574035023379484e-05, + "loss": 1.0514, + "mean_token_accuracy": 0.6973120331764221, + "num_tokens": 214178899.0, + "step": 88580 + }, + { + "epoch": 0.8122306775465298, + "learning_rate": 3.7555698175483636e-05, + "loss": 1.0301, + "mean_token_accuracy": 0.6959855020046234, + "num_tokens": 214210317.0, + "step": 88590 + }, + { + "epoch": 0.812322361786009, + "learning_rate": 3.753736132758779e-05, + "loss": 1.0216, + "mean_token_accuracy": 0.6968937814235687, + "num_tokens": 214240586.0, + "step": 88600 + }, + { + "epoch": 0.8124140460254882, + "learning_rate": 3.7519024479691946e-05, + "loss": 1.0107, + "mean_token_accuracy": 0.7076817810535431, + "num_tokens": 214270481.0, + "step": 88610 + }, + { + "epoch": 0.8125057302649674, + "learning_rate": 3.750068763179609e-05, + "loss": 1.0213, + "mean_token_accuracy": 0.7024851560592651, + "num_tokens": 214301220.0, + "step": 88620 + }, + { + "epoch": 0.8125974145044467, + "learning_rate": 3.748235078390025e-05, + "loss": 0.9704, + "mean_token_accuracy": 0.7130574345588684, + "num_tokens": 214332446.0, + "step": 88630 + }, + { + "epoch": 0.8126890987439259, + "learning_rate": 3.746401393600441e-05, + "loss": 1.011, + "mean_token_accuracy": 0.7014073669910431, + "num_tokens": 214363295.0, + "step": 88640 + }, + { + "epoch": 0.8127807829834052, + "learning_rate": 3.7445677088108554e-05, + "loss": 1.0504, + "mean_token_accuracy": 0.6962876319885254, + "num_tokens": 214396536.0, + "step": 88650 + }, + { + "epoch": 0.8128724672228844, + "learning_rate": 3.742734024021271e-05, + "loss": 1.0115, + "mean_token_accuracy": 0.6957520246505737, + "num_tokens": 214427161.0, + "step": 88660 + }, + { + "epoch": 0.8129641514623637, + "learning_rate": 3.740900339231686e-05, + "loss": 0.9785, + "mean_token_accuracy": 0.7070945560932159, + "num_tokens": 214456377.0, + "step": 88670 + }, + { + "epoch": 0.8130558357018428, + "learning_rate": 3.7390666544421016e-05, + "loss": 1.0255, + "mean_token_accuracy": 0.6996080458164216, + "num_tokens": 214488332.0, + "step": 88680 + }, + { + "epoch": 0.8131475199413221, + "learning_rate": 3.7372329696525175e-05, + "loss": 1.0398, + "mean_token_accuracy": 0.6954891562461853, + "num_tokens": 214520267.0, + "step": 88690 + }, + { + "epoch": 0.8132392041808013, + "learning_rate": 3.735399284862932e-05, + "loss": 1.0084, + "mean_token_accuracy": 0.6975082814693451, + "num_tokens": 214551572.0, + "step": 88700 + }, + { + "epoch": 0.8133308884202806, + "learning_rate": 3.733565600073348e-05, + "loss": 0.9864, + "mean_token_accuracy": 0.7096741735935211, + "num_tokens": 214581318.0, + "step": 88710 + }, + { + "epoch": 0.8134225726597598, + "learning_rate": 3.7317319152837623e-05, + "loss": 0.9964, + "mean_token_accuracy": 0.7107142269611358, + "num_tokens": 214612112.0, + "step": 88720 + }, + { + "epoch": 0.8135142568992391, + "learning_rate": 3.729898230494178e-05, + "loss": 1.0236, + "mean_token_accuracy": 0.7034564018249512, + "num_tokens": 214643725.0, + "step": 88730 + }, + { + "epoch": 0.8136059411387182, + "learning_rate": 3.728064545704594e-05, + "loss": 1.0077, + "mean_token_accuracy": 0.6969237089157104, + "num_tokens": 214673828.0, + "step": 88740 + }, + { + "epoch": 0.8136976253781975, + "learning_rate": 3.7262308609150086e-05, + "loss": 0.9537, + "mean_token_accuracy": 0.7197325646877288, + "num_tokens": 214704474.0, + "step": 88750 + }, + { + "epoch": 0.8137893096176767, + "learning_rate": 3.7243971761254244e-05, + "loss": 0.9941, + "mean_token_accuracy": 0.7051733493804931, + "num_tokens": 214736266.0, + "step": 88760 + }, + { + "epoch": 0.813880993857156, + "learning_rate": 3.7225634913358396e-05, + "loss": 1.0042, + "mean_token_accuracy": 0.7060157775878906, + "num_tokens": 214768187.0, + "step": 88770 + }, + { + "epoch": 0.8139726780966352, + "learning_rate": 3.720729806546255e-05, + "loss": 1.043, + "mean_token_accuracy": 0.6956783473491669, + "num_tokens": 214798631.0, + "step": 88780 + }, + { + "epoch": 0.8140643623361145, + "learning_rate": 3.718896121756671e-05, + "loss": 0.965, + "mean_token_accuracy": 0.7153402268886566, + "num_tokens": 214827238.0, + "step": 88790 + }, + { + "epoch": 0.8141560465755937, + "learning_rate": 3.717062436967085e-05, + "loss": 1.0014, + "mean_token_accuracy": 0.7031769633293152, + "num_tokens": 214857982.0, + "step": 88800 + }, + { + "epoch": 0.8142477308150728, + "learning_rate": 3.715228752177501e-05, + "loss": 1.0093, + "mean_token_accuracy": 0.7037087738513946, + "num_tokens": 214888607.0, + "step": 88810 + }, + { + "epoch": 0.8143394150545521, + "learning_rate": 3.713395067387916e-05, + "loss": 0.9918, + "mean_token_accuracy": 0.7101965010166168, + "num_tokens": 214919555.0, + "step": 88820 + }, + { + "epoch": 0.8144310992940313, + "learning_rate": 3.7115613825983314e-05, + "loss": 1.0026, + "mean_token_accuracy": 0.7070383369922638, + "num_tokens": 214950616.0, + "step": 88830 + }, + { + "epoch": 0.8145227835335106, + "learning_rate": 3.709727697808747e-05, + "loss": 1.0025, + "mean_token_accuracy": 0.7008816838264466, + "num_tokens": 214981063.0, + "step": 88840 + }, + { + "epoch": 0.8146144677729898, + "learning_rate": 3.707894013019162e-05, + "loss": 1.0292, + "mean_token_accuracy": 0.6949926257133484, + "num_tokens": 215011461.0, + "step": 88850 + }, + { + "epoch": 0.8147061520124691, + "learning_rate": 3.706060328229578e-05, + "loss": 1.0562, + "mean_token_accuracy": 0.6896575272083283, + "num_tokens": 215042214.0, + "step": 88860 + }, + { + "epoch": 0.8147978362519482, + "learning_rate": 3.704226643439993e-05, + "loss": 1.0016, + "mean_token_accuracy": 0.7054397463798523, + "num_tokens": 215072638.0, + "step": 88870 + }, + { + "epoch": 0.8148895204914275, + "learning_rate": 3.702392958650408e-05, + "loss": 0.9907, + "mean_token_accuracy": 0.7066368162631989, + "num_tokens": 215102781.0, + "step": 88880 + }, + { + "epoch": 0.8149812047309067, + "learning_rate": 3.700559273860824e-05, + "loss": 1.0176, + "mean_token_accuracy": 0.6987467110157013, + "num_tokens": 215134156.0, + "step": 88890 + }, + { + "epoch": 0.815072888970386, + "learning_rate": 3.6987255890712384e-05, + "loss": 0.9487, + "mean_token_accuracy": 0.7208304941654206, + "num_tokens": 215163529.0, + "step": 88900 + }, + { + "epoch": 0.8151645732098652, + "learning_rate": 3.696891904281654e-05, + "loss": 1.0128, + "mean_token_accuracy": 0.696195912361145, + "num_tokens": 215193480.0, + "step": 88910 + }, + { + "epoch": 0.8152562574493445, + "learning_rate": 3.6950582194920695e-05, + "loss": 1.0287, + "mean_token_accuracy": 0.6967327237129212, + "num_tokens": 215223621.0, + "step": 88920 + }, + { + "epoch": 0.8153479416888237, + "learning_rate": 3.6932245347024847e-05, + "loss": 1.0166, + "mean_token_accuracy": 0.7003809750080109, + "num_tokens": 215255584.0, + "step": 88930 + }, + { + "epoch": 0.8154396259283029, + "learning_rate": 3.6913908499129005e-05, + "loss": 1.0066, + "mean_token_accuracy": 0.7073103427886963, + "num_tokens": 215288761.0, + "step": 88940 + }, + { + "epoch": 0.8155313101677821, + "learning_rate": 3.689557165123316e-05, + "loss": 1.0326, + "mean_token_accuracy": 0.6977166712284089, + "num_tokens": 215320455.0, + "step": 88950 + }, + { + "epoch": 0.8156229944072614, + "learning_rate": 3.687723480333731e-05, + "loss": 0.9917, + "mean_token_accuracy": 0.7111059904098511, + "num_tokens": 215350223.0, + "step": 88960 + }, + { + "epoch": 0.8157146786467406, + "learning_rate": 3.685889795544146e-05, + "loss": 0.9994, + "mean_token_accuracy": 0.7083847284317016, + "num_tokens": 215379750.0, + "step": 88970 + }, + { + "epoch": 0.8158063628862199, + "learning_rate": 3.684056110754561e-05, + "loss": 1.0133, + "mean_token_accuracy": 0.704751193523407, + "num_tokens": 215409774.0, + "step": 88980 + }, + { + "epoch": 0.8158980471256991, + "learning_rate": 3.682222425964977e-05, + "loss": 1.0352, + "mean_token_accuracy": 0.6992090284824372, + "num_tokens": 215441878.0, + "step": 88990 + }, + { + "epoch": 0.8159897313651783, + "learning_rate": 3.680388741175392e-05, + "loss": 1.0072, + "mean_token_accuracy": 0.7007029592990875, + "num_tokens": 215473840.0, + "step": 89000 + }, + { + "epoch": 0.8160814156046575, + "learning_rate": 3.6785550563858075e-05, + "loss": 1.0101, + "mean_token_accuracy": 0.7076938152313232, + "num_tokens": 215505306.0, + "step": 89010 + }, + { + "epoch": 0.8161730998441368, + "learning_rate": 3.676721371596223e-05, + "loss": 0.9989, + "mean_token_accuracy": 0.7039797902107239, + "num_tokens": 215536470.0, + "step": 89020 + }, + { + "epoch": 0.816264784083616, + "learning_rate": 3.674887686806638e-05, + "loss": 0.9962, + "mean_token_accuracy": 0.7050273239612579, + "num_tokens": 215568089.0, + "step": 89030 + }, + { + "epoch": 0.8163564683230953, + "learning_rate": 3.673054002017054e-05, + "loss": 1.0111, + "mean_token_accuracy": 0.705344295501709, + "num_tokens": 215597927.0, + "step": 89040 + }, + { + "epoch": 0.8164481525625745, + "learning_rate": 3.671220317227469e-05, + "loss": 1.0453, + "mean_token_accuracy": 0.6925242125988007, + "num_tokens": 215628923.0, + "step": 89050 + }, + { + "epoch": 0.8165398368020538, + "learning_rate": 3.669386632437884e-05, + "loss": 1.0501, + "mean_token_accuracy": 0.6919217348098755, + "num_tokens": 215660744.0, + "step": 89060 + }, + { + "epoch": 0.8166315210415329, + "learning_rate": 3.667552947648299e-05, + "loss": 0.9929, + "mean_token_accuracy": 0.7100502789020539, + "num_tokens": 215691789.0, + "step": 89070 + }, + { + "epoch": 0.8167232052810122, + "learning_rate": 3.665719262858715e-05, + "loss": 0.9895, + "mean_token_accuracy": 0.705121123790741, + "num_tokens": 215721524.0, + "step": 89080 + }, + { + "epoch": 0.8168148895204914, + "learning_rate": 3.6638855780691303e-05, + "loss": 1.0218, + "mean_token_accuracy": 0.6980223894119263, + "num_tokens": 215752607.0, + "step": 89090 + }, + { + "epoch": 0.8169065737599707, + "learning_rate": 3.6620518932795455e-05, + "loss": 1.0035, + "mean_token_accuracy": 0.7023726284503937, + "num_tokens": 215782477.0, + "step": 89100 + }, + { + "epoch": 0.8169982579994499, + "learning_rate": 3.660218208489961e-05, + "loss": 1.0128, + "mean_token_accuracy": 0.7043716669082641, + "num_tokens": 215814852.0, + "step": 89110 + }, + { + "epoch": 0.8170899422389292, + "learning_rate": 3.658384523700376e-05, + "loss": 1.0231, + "mean_token_accuracy": 0.6985966920852661, + "num_tokens": 215846160.0, + "step": 89120 + }, + { + "epoch": 0.8171816264784083, + "learning_rate": 3.656550838910792e-05, + "loss": 0.9957, + "mean_token_accuracy": 0.7034257829189301, + "num_tokens": 215877751.0, + "step": 89130 + }, + { + "epoch": 0.8172733107178876, + "learning_rate": 3.654717154121207e-05, + "loss": 0.9372, + "mean_token_accuracy": 0.7221430957317352, + "num_tokens": 215907995.0, + "step": 89140 + }, + { + "epoch": 0.8173649949573668, + "learning_rate": 3.652883469331622e-05, + "loss": 1.025, + "mean_token_accuracy": 0.6958905518054962, + "num_tokens": 215939823.0, + "step": 89150 + }, + { + "epoch": 0.8174566791968461, + "learning_rate": 3.651049784542037e-05, + "loss": 1.0073, + "mean_token_accuracy": 0.6971342086791992, + "num_tokens": 215970094.0, + "step": 89160 + }, + { + "epoch": 0.8175483634363253, + "learning_rate": 3.6492160997524525e-05, + "loss": 1.0489, + "mean_token_accuracy": 0.6948488593101502, + "num_tokens": 216001819.0, + "step": 89170 + }, + { + "epoch": 0.8176400476758046, + "learning_rate": 3.6473824149628684e-05, + "loss": 1.0069, + "mean_token_accuracy": 0.7015217125415802, + "num_tokens": 216031591.0, + "step": 89180 + }, + { + "epoch": 0.8177317319152838, + "learning_rate": 3.6455487301732836e-05, + "loss": 1.0493, + "mean_token_accuracy": 0.695898962020874, + "num_tokens": 216063653.0, + "step": 89190 + }, + { + "epoch": 0.817823416154763, + "learning_rate": 3.643715045383699e-05, + "loss": 1.0123, + "mean_token_accuracy": 0.6982617616653443, + "num_tokens": 216094424.0, + "step": 89200 + }, + { + "epoch": 0.8179151003942422, + "learning_rate": 3.641881360594114e-05, + "loss": 1.005, + "mean_token_accuracy": 0.7010263442993164, + "num_tokens": 216124983.0, + "step": 89210 + }, + { + "epoch": 0.8180067846337215, + "learning_rate": 3.640047675804529e-05, + "loss": 1.0066, + "mean_token_accuracy": 0.704931628704071, + "num_tokens": 216155769.0, + "step": 89220 + }, + { + "epoch": 0.8180984688732007, + "learning_rate": 3.638213991014945e-05, + "loss": 1.0059, + "mean_token_accuracy": 0.7023326694965363, + "num_tokens": 216186840.0, + "step": 89230 + }, + { + "epoch": 0.81819015311268, + "learning_rate": 3.63638030622536e-05, + "loss": 1.0034, + "mean_token_accuracy": 0.7027499079704285, + "num_tokens": 216217092.0, + "step": 89240 + }, + { + "epoch": 0.8182818373521592, + "learning_rate": 3.6345466214357754e-05, + "loss": 0.9911, + "mean_token_accuracy": 0.706219208240509, + "num_tokens": 216248515.0, + "step": 89250 + }, + { + "epoch": 0.8183735215916383, + "learning_rate": 3.632712936646191e-05, + "loss": 0.989, + "mean_token_accuracy": 0.709886884689331, + "num_tokens": 216279085.0, + "step": 89260 + }, + { + "epoch": 0.8184652058311176, + "learning_rate": 3.630879251856606e-05, + "loss": 0.997, + "mean_token_accuracy": 0.7053792595863342, + "num_tokens": 216311495.0, + "step": 89270 + }, + { + "epoch": 0.8185568900705968, + "learning_rate": 3.6290455670670216e-05, + "loss": 1.0224, + "mean_token_accuracy": 0.6974895119667053, + "num_tokens": 216340883.0, + "step": 89280 + }, + { + "epoch": 0.8186485743100761, + "learning_rate": 3.627211882277437e-05, + "loss": 0.9947, + "mean_token_accuracy": 0.7037676692008972, + "num_tokens": 216370882.0, + "step": 89290 + }, + { + "epoch": 0.8187402585495553, + "learning_rate": 3.625378197487852e-05, + "loss": 1.0227, + "mean_token_accuracy": 0.6979583740234375, + "num_tokens": 216401683.0, + "step": 89300 + }, + { + "epoch": 0.8188319427890346, + "learning_rate": 3.623544512698268e-05, + "loss": 1.0257, + "mean_token_accuracy": 0.6965280830860138, + "num_tokens": 216433933.0, + "step": 89310 + }, + { + "epoch": 0.8189236270285138, + "learning_rate": 3.6217108279086824e-05, + "loss": 1.0254, + "mean_token_accuracy": 0.6979999899864197, + "num_tokens": 216464153.0, + "step": 89320 + }, + { + "epoch": 0.819015311267993, + "learning_rate": 3.619877143119098e-05, + "loss": 1.0098, + "mean_token_accuracy": 0.7058261871337891, + "num_tokens": 216494895.0, + "step": 89330 + }, + { + "epoch": 0.8191069955074722, + "learning_rate": 3.6180434583295134e-05, + "loss": 0.9862, + "mean_token_accuracy": 0.7088732123374939, + "num_tokens": 216525433.0, + "step": 89340 + }, + { + "epoch": 0.8191986797469515, + "learning_rate": 3.6162097735399286e-05, + "loss": 1.0223, + "mean_token_accuracy": 0.697758823633194, + "num_tokens": 216556873.0, + "step": 89350 + }, + { + "epoch": 0.8192903639864307, + "learning_rate": 3.6143760887503445e-05, + "loss": 1.0144, + "mean_token_accuracy": 0.6988425016403198, + "num_tokens": 216588096.0, + "step": 89360 + }, + { + "epoch": 0.81938204822591, + "learning_rate": 3.612542403960759e-05, + "loss": 0.9913, + "mean_token_accuracy": 0.7108243405818939, + "num_tokens": 216619745.0, + "step": 89370 + }, + { + "epoch": 0.8194737324653892, + "learning_rate": 3.610708719171175e-05, + "loss": 1.0102, + "mean_token_accuracy": 0.7040644705295562, + "num_tokens": 216651167.0, + "step": 89380 + }, + { + "epoch": 0.8195654167048685, + "learning_rate": 3.60887503438159e-05, + "loss": 1.0176, + "mean_token_accuracy": 0.6944675505161285, + "num_tokens": 216681878.0, + "step": 89390 + }, + { + "epoch": 0.8196571009443476, + "learning_rate": 3.607041349592005e-05, + "loss": 0.9937, + "mean_token_accuracy": 0.7025558471679687, + "num_tokens": 216711604.0, + "step": 89400 + }, + { + "epoch": 0.8197487851838269, + "learning_rate": 3.605207664802421e-05, + "loss": 1.0134, + "mean_token_accuracy": 0.7018278241157532, + "num_tokens": 216744331.0, + "step": 89410 + }, + { + "epoch": 0.8198404694233061, + "learning_rate": 3.6033739800128356e-05, + "loss": 0.9921, + "mean_token_accuracy": 0.7037769675254821, + "num_tokens": 216775567.0, + "step": 89420 + }, + { + "epoch": 0.8199321536627854, + "learning_rate": 3.6015402952232514e-05, + "loss": 1.027, + "mean_token_accuracy": 0.6993145942687988, + "num_tokens": 216806757.0, + "step": 89430 + }, + { + "epoch": 0.8200238379022646, + "learning_rate": 3.5997066104336666e-05, + "loss": 0.9929, + "mean_token_accuracy": 0.704660850763321, + "num_tokens": 216837817.0, + "step": 89440 + }, + { + "epoch": 0.8201155221417439, + "learning_rate": 3.597872925644082e-05, + "loss": 1.0033, + "mean_token_accuracy": 0.7048147082328796, + "num_tokens": 216867635.0, + "step": 89450 + }, + { + "epoch": 0.820207206381223, + "learning_rate": 3.596039240854498e-05, + "loss": 0.9987, + "mean_token_accuracy": 0.7068140983581543, + "num_tokens": 216899603.0, + "step": 89460 + }, + { + "epoch": 0.8202988906207023, + "learning_rate": 3.594205556064912e-05, + "loss": 1.0177, + "mean_token_accuracy": 0.7009139716625213, + "num_tokens": 216930405.0, + "step": 89470 + }, + { + "epoch": 0.8203905748601815, + "learning_rate": 3.592371871275328e-05, + "loss": 0.9835, + "mean_token_accuracy": 0.7070664763450623, + "num_tokens": 216961820.0, + "step": 89480 + }, + { + "epoch": 0.8204822590996608, + "learning_rate": 3.590538186485743e-05, + "loss": 1.0187, + "mean_token_accuracy": 0.6993075489997864, + "num_tokens": 216992694.0, + "step": 89490 + }, + { + "epoch": 0.82057394333914, + "learning_rate": 3.5887045016961584e-05, + "loss": 1.0052, + "mean_token_accuracy": 0.6994746148586273, + "num_tokens": 217024756.0, + "step": 89500 + }, + { + "epoch": 0.8206656275786193, + "learning_rate": 3.586870816906574e-05, + "loss": 0.9744, + "mean_token_accuracy": 0.7065632164478302, + "num_tokens": 217052681.0, + "step": 89510 + }, + { + "epoch": 0.8207573118180985, + "learning_rate": 3.585037132116989e-05, + "loss": 0.9998, + "mean_token_accuracy": 0.7040503263473511, + "num_tokens": 217082496.0, + "step": 89520 + }, + { + "epoch": 0.8208489960575777, + "learning_rate": 3.583203447327405e-05, + "loss": 1.0255, + "mean_token_accuracy": 0.7011173784732818, + "num_tokens": 217113957.0, + "step": 89530 + }, + { + "epoch": 0.8209406802970569, + "learning_rate": 3.58136976253782e-05, + "loss": 0.9932, + "mean_token_accuracy": 0.7075741112232208, + "num_tokens": 217145042.0, + "step": 89540 + }, + { + "epoch": 0.8210323645365362, + "learning_rate": 3.579536077748235e-05, + "loss": 0.9658, + "mean_token_accuracy": 0.7145200908184052, + "num_tokens": 217176799.0, + "step": 89550 + }, + { + "epoch": 0.8211240487760154, + "learning_rate": 3.577702392958651e-05, + "loss": 0.9976, + "mean_token_accuracy": 0.7022757530212402, + "num_tokens": 217207580.0, + "step": 89560 + }, + { + "epoch": 0.8212157330154947, + "learning_rate": 3.575868708169066e-05, + "loss": 0.9734, + "mean_token_accuracy": 0.7052068829536438, + "num_tokens": 217238051.0, + "step": 89570 + }, + { + "epoch": 0.8213074172549739, + "learning_rate": 3.574035023379481e-05, + "loss": 1.0238, + "mean_token_accuracy": 0.6927455723285675, + "num_tokens": 217267887.0, + "step": 89580 + }, + { + "epoch": 0.821399101494453, + "learning_rate": 3.5722013385898965e-05, + "loss": 0.9652, + "mean_token_accuracy": 0.7125248312950134, + "num_tokens": 217299104.0, + "step": 89590 + }, + { + "epoch": 0.8214907857339323, + "learning_rate": 3.5703676538003117e-05, + "loss": 1.0341, + "mean_token_accuracy": 0.697223562002182, + "num_tokens": 217329923.0, + "step": 89600 + }, + { + "epoch": 0.8215824699734116, + "learning_rate": 3.5685339690107275e-05, + "loss": 1.0219, + "mean_token_accuracy": 0.6976146042346955, + "num_tokens": 217361147.0, + "step": 89610 + }, + { + "epoch": 0.8216741542128908, + "learning_rate": 3.566700284221143e-05, + "loss": 1.0214, + "mean_token_accuracy": 0.7045253276824951, + "num_tokens": 217392845.0, + "step": 89620 + }, + { + "epoch": 0.8217658384523701, + "learning_rate": 3.564866599431558e-05, + "loss": 1.0016, + "mean_token_accuracy": 0.7000697910785675, + "num_tokens": 217422580.0, + "step": 89630 + }, + { + "epoch": 0.8218575226918493, + "learning_rate": 3.563032914641973e-05, + "loss": 1.0179, + "mean_token_accuracy": 0.6992241501808166, + "num_tokens": 217450942.0, + "step": 89640 + }, + { + "epoch": 0.8219492069313286, + "learning_rate": 3.561199229852388e-05, + "loss": 1.0205, + "mean_token_accuracy": 0.6992136180400849, + "num_tokens": 217482403.0, + "step": 89650 + }, + { + "epoch": 0.8220408911708077, + "learning_rate": 3.559365545062804e-05, + "loss": 1.0334, + "mean_token_accuracy": 0.6970073759555817, + "num_tokens": 217514582.0, + "step": 89660 + }, + { + "epoch": 0.822132575410287, + "learning_rate": 3.557531860273219e-05, + "loss": 0.9955, + "mean_token_accuracy": 0.7020188570022583, + "num_tokens": 217546495.0, + "step": 89670 + }, + { + "epoch": 0.8222242596497662, + "learning_rate": 3.5556981754836345e-05, + "loss": 1.0184, + "mean_token_accuracy": 0.6983431875705719, + "num_tokens": 217578598.0, + "step": 89680 + }, + { + "epoch": 0.8223159438892454, + "learning_rate": 3.55386449069405e-05, + "loss": 1.0252, + "mean_token_accuracy": 0.6960439920425415, + "num_tokens": 217609151.0, + "step": 89690 + }, + { + "epoch": 0.8224076281287247, + "learning_rate": 3.5520308059044656e-05, + "loss": 0.9948, + "mean_token_accuracy": 0.6960030615329742, + "num_tokens": 217638871.0, + "step": 89700 + }, + { + "epoch": 0.822499312368204, + "learning_rate": 3.550197121114881e-05, + "loss": 1.0476, + "mean_token_accuracy": 0.6921974420547485, + "num_tokens": 217670232.0, + "step": 89710 + }, + { + "epoch": 0.8225909966076831, + "learning_rate": 3.548363436325296e-05, + "loss": 1.0083, + "mean_token_accuracy": 0.7024901568889618, + "num_tokens": 217701328.0, + "step": 89720 + }, + { + "epoch": 0.8226826808471623, + "learning_rate": 3.546529751535711e-05, + "loss": 1.0081, + "mean_token_accuracy": 0.7058868885040284, + "num_tokens": 217732749.0, + "step": 89730 + }, + { + "epoch": 0.8227743650866416, + "learning_rate": 3.544696066746126e-05, + "loss": 1.0074, + "mean_token_accuracy": 0.6999070465564727, + "num_tokens": 217764441.0, + "step": 89740 + }, + { + "epoch": 0.8228660493261208, + "learning_rate": 3.542862381956542e-05, + "loss": 1.0087, + "mean_token_accuracy": 0.6974696278572082, + "num_tokens": 217794611.0, + "step": 89750 + }, + { + "epoch": 0.8229577335656001, + "learning_rate": 3.5410286971669573e-05, + "loss": 0.9934, + "mean_token_accuracy": 0.7009398221969605, + "num_tokens": 217824505.0, + "step": 89760 + }, + { + "epoch": 0.8230494178050793, + "learning_rate": 3.5391950123773725e-05, + "loss": 1.0075, + "mean_token_accuracy": 0.7024871706962585, + "num_tokens": 217856092.0, + "step": 89770 + }, + { + "epoch": 0.8231411020445586, + "learning_rate": 3.537361327587788e-05, + "loss": 1.0062, + "mean_token_accuracy": 0.7027764260768891, + "num_tokens": 217888141.0, + "step": 89780 + }, + { + "epoch": 0.8232327862840377, + "learning_rate": 3.535527642798203e-05, + "loss": 1.0308, + "mean_token_accuracy": 0.6936926186084748, + "num_tokens": 217919838.0, + "step": 89790 + }, + { + "epoch": 0.823324470523517, + "learning_rate": 3.533693958008619e-05, + "loss": 0.9868, + "mean_token_accuracy": 0.7085601270198822, + "num_tokens": 217948838.0, + "step": 89800 + }, + { + "epoch": 0.8234161547629962, + "learning_rate": 3.531860273219034e-05, + "loss": 0.9783, + "mean_token_accuracy": 0.708295714855194, + "num_tokens": 217980138.0, + "step": 89810 + }, + { + "epoch": 0.8235078390024755, + "learning_rate": 3.530026588429449e-05, + "loss": 0.9814, + "mean_token_accuracy": 0.7044698834419251, + "num_tokens": 218010471.0, + "step": 89820 + }, + { + "epoch": 0.8235995232419547, + "learning_rate": 3.528192903639864e-05, + "loss": 1.0154, + "mean_token_accuracy": 0.7017762362957001, + "num_tokens": 218042498.0, + "step": 89830 + }, + { + "epoch": 0.823691207481434, + "learning_rate": 3.5263592188502795e-05, + "loss": 1.0158, + "mean_token_accuracy": 0.6979267001152039, + "num_tokens": 218074215.0, + "step": 89840 + }, + { + "epoch": 0.8237828917209131, + "learning_rate": 3.5245255340606954e-05, + "loss": 1.0274, + "mean_token_accuracy": 0.7039165735244751, + "num_tokens": 218105056.0, + "step": 89850 + }, + { + "epoch": 0.8238745759603924, + "learning_rate": 3.5226918492711106e-05, + "loss": 1.0199, + "mean_token_accuracy": 0.6995380878448486, + "num_tokens": 218136579.0, + "step": 89860 + }, + { + "epoch": 0.8239662601998716, + "learning_rate": 3.520858164481526e-05, + "loss": 1.0113, + "mean_token_accuracy": 0.6981495440006256, + "num_tokens": 218167125.0, + "step": 89870 + }, + { + "epoch": 0.8240579444393509, + "learning_rate": 3.5190244796919416e-05, + "loss": 1.0159, + "mean_token_accuracy": 0.6977125823497772, + "num_tokens": 218196264.0, + "step": 89880 + }, + { + "epoch": 0.8241496286788301, + "learning_rate": 3.517190794902356e-05, + "loss": 1.0179, + "mean_token_accuracy": 0.7013065934181213, + "num_tokens": 218227752.0, + "step": 89890 + }, + { + "epoch": 0.8242413129183094, + "learning_rate": 3.515357110112772e-05, + "loss": 1.0255, + "mean_token_accuracy": 0.6967093110084533, + "num_tokens": 218259509.0, + "step": 89900 + }, + { + "epoch": 0.8243329971577886, + "learning_rate": 3.513523425323187e-05, + "loss": 0.9907, + "mean_token_accuracy": 0.7059114515781403, + "num_tokens": 218290287.0, + "step": 89910 + }, + { + "epoch": 0.8244246813972678, + "learning_rate": 3.5116897405336024e-05, + "loss": 1.0226, + "mean_token_accuracy": 0.7021823167800904, + "num_tokens": 218321876.0, + "step": 89920 + }, + { + "epoch": 0.824516365636747, + "learning_rate": 3.509856055744018e-05, + "loss": 1.0221, + "mean_token_accuracy": 0.7003953516483307, + "num_tokens": 218352743.0, + "step": 89930 + }, + { + "epoch": 0.8246080498762263, + "learning_rate": 3.508022370954433e-05, + "loss": 0.9892, + "mean_token_accuracy": 0.7012200355529785, + "num_tokens": 218382613.0, + "step": 89940 + }, + { + "epoch": 0.8246997341157055, + "learning_rate": 3.5061886861648486e-05, + "loss": 1.0293, + "mean_token_accuracy": 0.6971102952957153, + "num_tokens": 218413926.0, + "step": 89950 + }, + { + "epoch": 0.8247914183551848, + "learning_rate": 3.504355001375264e-05, + "loss": 1.0004, + "mean_token_accuracy": 0.7024656474590302, + "num_tokens": 218445904.0, + "step": 89960 + }, + { + "epoch": 0.824883102594664, + "learning_rate": 3.502521316585679e-05, + "loss": 0.9816, + "mean_token_accuracy": 0.7075865745544434, + "num_tokens": 218477458.0, + "step": 89970 + }, + { + "epoch": 0.8249747868341432, + "learning_rate": 3.500687631796095e-05, + "loss": 1.0043, + "mean_token_accuracy": 0.7051225125789642, + "num_tokens": 218507963.0, + "step": 89980 + }, + { + "epoch": 0.8250664710736224, + "learning_rate": 3.4988539470065094e-05, + "loss": 1.0097, + "mean_token_accuracy": 0.7018232405185699, + "num_tokens": 218538219.0, + "step": 89990 + }, + { + "epoch": 0.8251581553131017, + "learning_rate": 3.497020262216925e-05, + "loss": 1.0053, + "mean_token_accuracy": 0.7008326649665833, + "num_tokens": 218567533.0, + "step": 90000 + }, + { + "epoch": 0.8252498395525809, + "learning_rate": 3.4951865774273404e-05, + "loss": 1.0281, + "mean_token_accuracy": 0.7011227130889892, + "num_tokens": 218599491.0, + "step": 90010 + }, + { + "epoch": 0.8253415237920602, + "learning_rate": 3.4933528926377556e-05, + "loss": 1.0019, + "mean_token_accuracy": 0.7045192062854767, + "num_tokens": 218631049.0, + "step": 90020 + }, + { + "epoch": 0.8254332080315394, + "learning_rate": 3.4915192078481715e-05, + "loss": 1.0167, + "mean_token_accuracy": 0.700628525018692, + "num_tokens": 218661502.0, + "step": 90030 + }, + { + "epoch": 0.8255248922710187, + "learning_rate": 3.489685523058586e-05, + "loss": 0.997, + "mean_token_accuracy": 0.7090557515621185, + "num_tokens": 218692564.0, + "step": 90040 + }, + { + "epoch": 0.8256165765104978, + "learning_rate": 3.487851838269002e-05, + "loss": 1.011, + "mean_token_accuracy": 0.6990772426128388, + "num_tokens": 218722354.0, + "step": 90050 + }, + { + "epoch": 0.825708260749977, + "learning_rate": 3.486018153479417e-05, + "loss": 1.0096, + "mean_token_accuracy": 0.700513380765915, + "num_tokens": 218752899.0, + "step": 90060 + }, + { + "epoch": 0.8257999449894563, + "learning_rate": 3.484184468689832e-05, + "loss": 1.0326, + "mean_token_accuracy": 0.7009813487529755, + "num_tokens": 218784013.0, + "step": 90070 + }, + { + "epoch": 0.8258916292289356, + "learning_rate": 3.482350783900248e-05, + "loss": 1.0228, + "mean_token_accuracy": 0.6992367684841156, + "num_tokens": 218815934.0, + "step": 90080 + }, + { + "epoch": 0.8259833134684148, + "learning_rate": 3.4805170991106626e-05, + "loss": 1.0141, + "mean_token_accuracy": 0.7031391203403473, + "num_tokens": 218846950.0, + "step": 90090 + }, + { + "epoch": 0.826074997707894, + "learning_rate": 3.4786834143210784e-05, + "loss": 1.0186, + "mean_token_accuracy": 0.6979718327522277, + "num_tokens": 218879495.0, + "step": 90100 + }, + { + "epoch": 0.8261666819473732, + "learning_rate": 3.4768497295314936e-05, + "loss": 1.0066, + "mean_token_accuracy": 0.697433739900589, + "num_tokens": 218909582.0, + "step": 90110 + }, + { + "epoch": 0.8262583661868524, + "learning_rate": 3.475016044741909e-05, + "loss": 0.9725, + "mean_token_accuracy": 0.7097954154014587, + "num_tokens": 218938605.0, + "step": 90120 + }, + { + "epoch": 0.8263500504263317, + "learning_rate": 3.473182359952325e-05, + "loss": 1.0176, + "mean_token_accuracy": 0.6963508069515228, + "num_tokens": 218970352.0, + "step": 90130 + }, + { + "epoch": 0.826441734665811, + "learning_rate": 3.471348675162739e-05, + "loss": 1.0314, + "mean_token_accuracy": 0.6978467702865601, + "num_tokens": 219001659.0, + "step": 90140 + }, + { + "epoch": 0.8265334189052902, + "learning_rate": 3.469514990373155e-05, + "loss": 1.0079, + "mean_token_accuracy": 0.7022634148597717, + "num_tokens": 219032760.0, + "step": 90150 + }, + { + "epoch": 0.8266251031447694, + "learning_rate": 3.46768130558357e-05, + "loss": 1.004, + "mean_token_accuracy": 0.6996465802192688, + "num_tokens": 219063722.0, + "step": 90160 + }, + { + "epoch": 0.8267167873842487, + "learning_rate": 3.4658476207939854e-05, + "loss": 1.0202, + "mean_token_accuracy": 0.7048012614250183, + "num_tokens": 219093961.0, + "step": 90170 + }, + { + "epoch": 0.8268084716237278, + "learning_rate": 3.464013936004401e-05, + "loss": 0.9807, + "mean_token_accuracy": 0.7043280661106109, + "num_tokens": 219121756.0, + "step": 90180 + }, + { + "epoch": 0.8269001558632071, + "learning_rate": 3.4621802512148165e-05, + "loss": 0.9924, + "mean_token_accuracy": 0.7078893721103668, + "num_tokens": 219153052.0, + "step": 90190 + }, + { + "epoch": 0.8269918401026863, + "learning_rate": 3.460346566425232e-05, + "loss": 1.0259, + "mean_token_accuracy": 0.6989540219306946, + "num_tokens": 219184459.0, + "step": 90200 + }, + { + "epoch": 0.8270835243421656, + "learning_rate": 3.458512881635647e-05, + "loss": 1.0017, + "mean_token_accuracy": 0.7045412361621857, + "num_tokens": 219215437.0, + "step": 90210 + }, + { + "epoch": 0.8271752085816448, + "learning_rate": 3.456679196846062e-05, + "loss": 1.0165, + "mean_token_accuracy": 0.7025941193103791, + "num_tokens": 219247036.0, + "step": 90220 + }, + { + "epoch": 0.8272668928211241, + "learning_rate": 3.454845512056478e-05, + "loss": 1.0215, + "mean_token_accuracy": 0.698662930727005, + "num_tokens": 219277685.0, + "step": 90230 + }, + { + "epoch": 0.8273585770606032, + "learning_rate": 3.453011827266893e-05, + "loss": 1.0025, + "mean_token_accuracy": 0.7031780660152436, + "num_tokens": 219307850.0, + "step": 90240 + }, + { + "epoch": 0.8274502613000825, + "learning_rate": 3.451178142477308e-05, + "loss": 1.008, + "mean_token_accuracy": 0.7078184187412262, + "num_tokens": 219338499.0, + "step": 90250 + }, + { + "epoch": 0.8275419455395617, + "learning_rate": 3.4493444576877235e-05, + "loss": 0.9852, + "mean_token_accuracy": 0.7059654235839844, + "num_tokens": 219370701.0, + "step": 90260 + }, + { + "epoch": 0.827633629779041, + "learning_rate": 3.4475107728981386e-05, + "loss": 1.017, + "mean_token_accuracy": 0.6988462030887603, + "num_tokens": 219401369.0, + "step": 90270 + }, + { + "epoch": 0.8277253140185202, + "learning_rate": 3.4456770881085545e-05, + "loss": 1.0309, + "mean_token_accuracy": 0.6990213990211487, + "num_tokens": 219434393.0, + "step": 90280 + }, + { + "epoch": 0.8278169982579995, + "learning_rate": 3.44384340331897e-05, + "loss": 0.9756, + "mean_token_accuracy": 0.706069940328598, + "num_tokens": 219463910.0, + "step": 90290 + }, + { + "epoch": 0.8279086824974787, + "learning_rate": 3.442009718529385e-05, + "loss": 0.9971, + "mean_token_accuracy": 0.7024085760116577, + "num_tokens": 219492780.0, + "step": 90300 + }, + { + "epoch": 0.8280003667369579, + "learning_rate": 3.4401760337398e-05, + "loss": 1.0256, + "mean_token_accuracy": 0.6982463598251343, + "num_tokens": 219524639.0, + "step": 90310 + }, + { + "epoch": 0.8280920509764371, + "learning_rate": 3.438342348950216e-05, + "loss": 1.0181, + "mean_token_accuracy": 0.6987064480781555, + "num_tokens": 219556189.0, + "step": 90320 + }, + { + "epoch": 0.8281837352159164, + "learning_rate": 3.436508664160631e-05, + "loss": 1.0209, + "mean_token_accuracy": 0.700279176235199, + "num_tokens": 219586879.0, + "step": 90330 + }, + { + "epoch": 0.8282754194553956, + "learning_rate": 3.434674979371046e-05, + "loss": 1.0371, + "mean_token_accuracy": 0.6897796988487244, + "num_tokens": 219618058.0, + "step": 90340 + }, + { + "epoch": 0.8283671036948749, + "learning_rate": 3.4328412945814615e-05, + "loss": 1.034, + "mean_token_accuracy": 0.6963342905044556, + "num_tokens": 219647893.0, + "step": 90350 + }, + { + "epoch": 0.8284587879343541, + "learning_rate": 3.431007609791877e-05, + "loss": 0.9868, + "mean_token_accuracy": 0.7044245958328247, + "num_tokens": 219678596.0, + "step": 90360 + }, + { + "epoch": 0.8285504721738333, + "learning_rate": 3.4291739250022925e-05, + "loss": 1.0159, + "mean_token_accuracy": 0.7038574755191803, + "num_tokens": 219709534.0, + "step": 90370 + }, + { + "epoch": 0.8286421564133125, + "learning_rate": 3.427340240212708e-05, + "loss": 1.0055, + "mean_token_accuracy": 0.7060499966144562, + "num_tokens": 219739381.0, + "step": 90380 + }, + { + "epoch": 0.8287338406527918, + "learning_rate": 3.425506555423123e-05, + "loss": 0.9914, + "mean_token_accuracy": 0.7050133585929871, + "num_tokens": 219770230.0, + "step": 90390 + }, + { + "epoch": 0.828825524892271, + "learning_rate": 3.423672870633538e-05, + "loss": 1.0049, + "mean_token_accuracy": 0.7040414988994599, + "num_tokens": 219800660.0, + "step": 90400 + }, + { + "epoch": 0.8289172091317503, + "learning_rate": 3.421839185843953e-05, + "loss": 1.0395, + "mean_token_accuracy": 0.6939877152442933, + "num_tokens": 219831733.0, + "step": 90410 + }, + { + "epoch": 0.8290088933712295, + "learning_rate": 3.420005501054369e-05, + "loss": 1.0159, + "mean_token_accuracy": 0.698121440410614, + "num_tokens": 219861302.0, + "step": 90420 + }, + { + "epoch": 0.8291005776107088, + "learning_rate": 3.4181718162647843e-05, + "loss": 1.003, + "mean_token_accuracy": 0.6998128890991211, + "num_tokens": 219891627.0, + "step": 90430 + }, + { + "epoch": 0.8291922618501879, + "learning_rate": 3.4163381314751995e-05, + "loss": 1.0458, + "mean_token_accuracy": 0.6945520102977752, + "num_tokens": 219923847.0, + "step": 90440 + }, + { + "epoch": 0.8292839460896672, + "learning_rate": 3.414504446685615e-05, + "loss": 0.9994, + "mean_token_accuracy": 0.7000109255313873, + "num_tokens": 219955720.0, + "step": 90450 + }, + { + "epoch": 0.8293756303291464, + "learning_rate": 3.41267076189603e-05, + "loss": 1.0181, + "mean_token_accuracy": 0.6990287780761719, + "num_tokens": 219987438.0, + "step": 90460 + }, + { + "epoch": 0.8294673145686257, + "learning_rate": 3.410837077106446e-05, + "loss": 1.0016, + "mean_token_accuracy": 0.7014613449573517, + "num_tokens": 220016924.0, + "step": 90470 + }, + { + "epoch": 0.8295589988081049, + "learning_rate": 3.409003392316861e-05, + "loss": 1.0117, + "mean_token_accuracy": 0.6967711329460144, + "num_tokens": 220046028.0, + "step": 90480 + }, + { + "epoch": 0.8296506830475842, + "learning_rate": 3.407169707527276e-05, + "loss": 1.0282, + "mean_token_accuracy": 0.7010338187217713, + "num_tokens": 220077468.0, + "step": 90490 + }, + { + "epoch": 0.8297423672870634, + "learning_rate": 3.405336022737692e-05, + "loss": 1.0289, + "mean_token_accuracy": 0.6963151395320892, + "num_tokens": 220109071.0, + "step": 90500 + }, + { + "epoch": 0.8298340515265425, + "learning_rate": 3.4035023379481065e-05, + "loss": 0.9816, + "mean_token_accuracy": 0.7081152498722076, + "num_tokens": 220140515.0, + "step": 90510 + }, + { + "epoch": 0.8299257357660218, + "learning_rate": 3.4016686531585224e-05, + "loss": 1.0178, + "mean_token_accuracy": 0.6993720293045044, + "num_tokens": 220170837.0, + "step": 90520 + }, + { + "epoch": 0.830017420005501, + "learning_rate": 3.3998349683689376e-05, + "loss": 1.0202, + "mean_token_accuracy": 0.7022325396537781, + "num_tokens": 220201937.0, + "step": 90530 + }, + { + "epoch": 0.8301091042449803, + "learning_rate": 3.398001283579353e-05, + "loss": 1.0012, + "mean_token_accuracy": 0.6982310712337494, + "num_tokens": 220231434.0, + "step": 90540 + }, + { + "epoch": 0.8302007884844596, + "learning_rate": 3.3961675987897686e-05, + "loss": 1.0367, + "mean_token_accuracy": 0.699015998840332, + "num_tokens": 220263165.0, + "step": 90550 + }, + { + "epoch": 0.8302924727239388, + "learning_rate": 3.394333914000183e-05, + "loss": 1.0574, + "mean_token_accuracy": 0.6866241574287415, + "num_tokens": 220295248.0, + "step": 90560 + }, + { + "epoch": 0.8303841569634179, + "learning_rate": 3.392500229210599e-05, + "loss": 1.0033, + "mean_token_accuracy": 0.7033745348453522, + "num_tokens": 220326770.0, + "step": 90570 + }, + { + "epoch": 0.8304758412028972, + "learning_rate": 3.390666544421014e-05, + "loss": 0.984, + "mean_token_accuracy": 0.7064521014690399, + "num_tokens": 220357751.0, + "step": 90580 + }, + { + "epoch": 0.8305675254423764, + "learning_rate": 3.3888328596314294e-05, + "loss": 1.0167, + "mean_token_accuracy": 0.6974581778049469, + "num_tokens": 220388449.0, + "step": 90590 + }, + { + "epoch": 0.8306592096818557, + "learning_rate": 3.386999174841845e-05, + "loss": 1.0096, + "mean_token_accuracy": 0.6993870735168457, + "num_tokens": 220418448.0, + "step": 90600 + }, + { + "epoch": 0.8307508939213349, + "learning_rate": 3.38516549005226e-05, + "loss": 1.0177, + "mean_token_accuracy": 0.7009082913398743, + "num_tokens": 220450316.0, + "step": 90610 + }, + { + "epoch": 0.8308425781608142, + "learning_rate": 3.3833318052626756e-05, + "loss": 1.0182, + "mean_token_accuracy": 0.6961587607860565, + "num_tokens": 220482135.0, + "step": 90620 + }, + { + "epoch": 0.8309342624002934, + "learning_rate": 3.381498120473091e-05, + "loss": 0.9942, + "mean_token_accuracy": 0.7034704446792602, + "num_tokens": 220514095.0, + "step": 90630 + }, + { + "epoch": 0.8310259466397726, + "learning_rate": 3.379664435683506e-05, + "loss": 1.0255, + "mean_token_accuracy": 0.6975188851356506, + "num_tokens": 220545431.0, + "step": 90640 + }, + { + "epoch": 0.8311176308792518, + "learning_rate": 3.377830750893922e-05, + "loss": 1.0203, + "mean_token_accuracy": 0.6978191614151001, + "num_tokens": 220575769.0, + "step": 90650 + }, + { + "epoch": 0.8312093151187311, + "learning_rate": 3.3759970661043364e-05, + "loss": 0.9952, + "mean_token_accuracy": 0.6992539465427399, + "num_tokens": 220604764.0, + "step": 90660 + }, + { + "epoch": 0.8313009993582103, + "learning_rate": 3.374163381314752e-05, + "loss": 1.0284, + "mean_token_accuracy": 0.6933148920536041, + "num_tokens": 220636782.0, + "step": 90670 + }, + { + "epoch": 0.8313926835976896, + "learning_rate": 3.3723296965251674e-05, + "loss": 1.0167, + "mean_token_accuracy": 0.6988054394721985, + "num_tokens": 220668817.0, + "step": 90680 + }, + { + "epoch": 0.8314843678371688, + "learning_rate": 3.3704960117355826e-05, + "loss": 1.0148, + "mean_token_accuracy": 0.6956416130065918, + "num_tokens": 220699556.0, + "step": 90690 + }, + { + "epoch": 0.831576052076648, + "learning_rate": 3.3686623269459985e-05, + "loss": 1.0118, + "mean_token_accuracy": 0.6987706780433655, + "num_tokens": 220730887.0, + "step": 90700 + }, + { + "epoch": 0.8316677363161272, + "learning_rate": 3.366828642156413e-05, + "loss": 1.0083, + "mean_token_accuracy": 0.7023152768611908, + "num_tokens": 220761398.0, + "step": 90710 + }, + { + "epoch": 0.8317594205556065, + "learning_rate": 3.364994957366829e-05, + "loss": 1.0054, + "mean_token_accuracy": 0.7016844093799591, + "num_tokens": 220791129.0, + "step": 90720 + }, + { + "epoch": 0.8318511047950857, + "learning_rate": 3.363161272577244e-05, + "loss": 0.9968, + "mean_token_accuracy": 0.7054231762886047, + "num_tokens": 220822540.0, + "step": 90730 + }, + { + "epoch": 0.831942789034565, + "learning_rate": 3.361327587787659e-05, + "loss": 1.0025, + "mean_token_accuracy": 0.7013937592506408, + "num_tokens": 220852936.0, + "step": 90740 + }, + { + "epoch": 0.8320344732740442, + "learning_rate": 3.359493902998075e-05, + "loss": 1.0188, + "mean_token_accuracy": 0.7003185212612152, + "num_tokens": 220884434.0, + "step": 90750 + }, + { + "epoch": 0.8321261575135235, + "learning_rate": 3.3576602182084896e-05, + "loss": 1.0149, + "mean_token_accuracy": 0.6970611453056336, + "num_tokens": 220916046.0, + "step": 90760 + }, + { + "epoch": 0.8322178417530026, + "learning_rate": 3.3558265334189054e-05, + "loss": 1.0136, + "mean_token_accuracy": 0.6984663009643555, + "num_tokens": 220946779.0, + "step": 90770 + }, + { + "epoch": 0.8323095259924819, + "learning_rate": 3.3539928486293206e-05, + "loss": 0.9984, + "mean_token_accuracy": 0.7013566851615906, + "num_tokens": 220976094.0, + "step": 90780 + }, + { + "epoch": 0.8324012102319611, + "learning_rate": 3.352159163839736e-05, + "loss": 1.0262, + "mean_token_accuracy": 0.6944224417209626, + "num_tokens": 221008597.0, + "step": 90790 + }, + { + "epoch": 0.8324928944714404, + "learning_rate": 3.350325479050152e-05, + "loss": 1.009, + "mean_token_accuracy": 0.7017030000686646, + "num_tokens": 221039625.0, + "step": 90800 + }, + { + "epoch": 0.8325845787109196, + "learning_rate": 3.348491794260567e-05, + "loss": 1.0247, + "mean_token_accuracy": 0.6982905983924865, + "num_tokens": 221071119.0, + "step": 90810 + }, + { + "epoch": 0.8326762629503989, + "learning_rate": 3.346658109470982e-05, + "loss": 1.0039, + "mean_token_accuracy": 0.695676851272583, + "num_tokens": 221101358.0, + "step": 90820 + }, + { + "epoch": 0.832767947189878, + "learning_rate": 3.344824424681397e-05, + "loss": 1.0041, + "mean_token_accuracy": 0.7050034761428833, + "num_tokens": 221131862.0, + "step": 90830 + }, + { + "epoch": 0.8328596314293573, + "learning_rate": 3.3429907398918124e-05, + "loss": 1.01, + "mean_token_accuracy": 0.6967243671417236, + "num_tokens": 221161063.0, + "step": 90840 + }, + { + "epoch": 0.8329513156688365, + "learning_rate": 3.341157055102228e-05, + "loss": 0.9924, + "mean_token_accuracy": 0.701437908411026, + "num_tokens": 221192622.0, + "step": 90850 + }, + { + "epoch": 0.8330429999083158, + "learning_rate": 3.3393233703126435e-05, + "loss": 1.0119, + "mean_token_accuracy": 0.7018767178058625, + "num_tokens": 221223913.0, + "step": 90860 + }, + { + "epoch": 0.833134684147795, + "learning_rate": 3.337489685523059e-05, + "loss": 1.036, + "mean_token_accuracy": 0.6921814620494843, + "num_tokens": 221255890.0, + "step": 90870 + }, + { + "epoch": 0.8332263683872743, + "learning_rate": 3.335656000733474e-05, + "loss": 1.0031, + "mean_token_accuracy": 0.7054585635662078, + "num_tokens": 221286108.0, + "step": 90880 + }, + { + "epoch": 0.8333180526267535, + "learning_rate": 3.333822315943889e-05, + "loss": 0.9852, + "mean_token_accuracy": 0.7051441967487335, + "num_tokens": 221316435.0, + "step": 90890 + }, + { + "epoch": 0.8334097368662327, + "learning_rate": 3.331988631154305e-05, + "loss": 1.0213, + "mean_token_accuracy": 0.700000774860382, + "num_tokens": 221345928.0, + "step": 90900 + }, + { + "epoch": 0.8335014211057119, + "learning_rate": 3.33015494636472e-05, + "loss": 1.0119, + "mean_token_accuracy": 0.6981248319149017, + "num_tokens": 221377151.0, + "step": 90910 + }, + { + "epoch": 0.8335931053451912, + "learning_rate": 3.328321261575135e-05, + "loss": 1.0044, + "mean_token_accuracy": 0.6982454180717468, + "num_tokens": 221407959.0, + "step": 90920 + }, + { + "epoch": 0.8336847895846704, + "learning_rate": 3.3264875767855505e-05, + "loss": 1.0177, + "mean_token_accuracy": 0.6998045980930329, + "num_tokens": 221439794.0, + "step": 90930 + }, + { + "epoch": 0.8337764738241497, + "learning_rate": 3.324653891995966e-05, + "loss": 1.0388, + "mean_token_accuracy": 0.6901152074337006, + "num_tokens": 221472015.0, + "step": 90940 + }, + { + "epoch": 0.8338681580636289, + "learning_rate": 3.3228202072063815e-05, + "loss": 0.9849, + "mean_token_accuracy": 0.6987499892711639, + "num_tokens": 221502175.0, + "step": 90950 + }, + { + "epoch": 0.833959842303108, + "learning_rate": 3.320986522416797e-05, + "loss": 1.0011, + "mean_token_accuracy": 0.7005788147449493, + "num_tokens": 221531535.0, + "step": 90960 + }, + { + "epoch": 0.8340515265425873, + "learning_rate": 3.319152837627212e-05, + "loss": 1.0067, + "mean_token_accuracy": 0.6989462614059448, + "num_tokens": 221562774.0, + "step": 90970 + }, + { + "epoch": 0.8341432107820665, + "learning_rate": 3.317319152837627e-05, + "loss": 1.0042, + "mean_token_accuracy": 0.7047168850898743, + "num_tokens": 221593380.0, + "step": 90980 + }, + { + "epoch": 0.8342348950215458, + "learning_rate": 3.315485468048043e-05, + "loss": 1.003, + "mean_token_accuracy": 0.7033378303050994, + "num_tokens": 221624592.0, + "step": 90990 + }, + { + "epoch": 0.834326579261025, + "learning_rate": 3.313651783258458e-05, + "loss": 1.038, + "mean_token_accuracy": 0.6974779486656189, + "num_tokens": 221656119.0, + "step": 91000 + }, + { + "epoch": 0.8344182635005043, + "learning_rate": 3.311818098468873e-05, + "loss": 0.9984, + "mean_token_accuracy": 0.7083793520927429, + "num_tokens": 221686031.0, + "step": 91010 + }, + { + "epoch": 0.8345099477399835, + "learning_rate": 3.3099844136792885e-05, + "loss": 1.0157, + "mean_token_accuracy": 0.7002842545509338, + "num_tokens": 221717223.0, + "step": 91020 + }, + { + "epoch": 0.8346016319794627, + "learning_rate": 3.308150728889704e-05, + "loss": 1.0262, + "mean_token_accuracy": 0.6953075408935547, + "num_tokens": 221749389.0, + "step": 91030 + }, + { + "epoch": 0.8346933162189419, + "learning_rate": 3.3063170441001195e-05, + "loss": 1.0022, + "mean_token_accuracy": 0.700938618183136, + "num_tokens": 221779349.0, + "step": 91040 + }, + { + "epoch": 0.8347850004584212, + "learning_rate": 3.304483359310535e-05, + "loss": 1.0029, + "mean_token_accuracy": 0.703021252155304, + "num_tokens": 221810248.0, + "step": 91050 + }, + { + "epoch": 0.8348766846979004, + "learning_rate": 3.30264967452095e-05, + "loss": 0.9991, + "mean_token_accuracy": 0.7039738297462463, + "num_tokens": 221842744.0, + "step": 91060 + }, + { + "epoch": 0.8349683689373797, + "learning_rate": 3.300815989731365e-05, + "loss": 1.0108, + "mean_token_accuracy": 0.7010632276535034, + "num_tokens": 221871445.0, + "step": 91070 + }, + { + "epoch": 0.8350600531768589, + "learning_rate": 3.29898230494178e-05, + "loss": 0.9787, + "mean_token_accuracy": 0.7070703208446503, + "num_tokens": 221900249.0, + "step": 91080 + }, + { + "epoch": 0.8351517374163381, + "learning_rate": 3.297148620152196e-05, + "loss": 1.0075, + "mean_token_accuracy": 0.6969705879688263, + "num_tokens": 221932060.0, + "step": 91090 + }, + { + "epoch": 0.8352434216558173, + "learning_rate": 3.2953149353626113e-05, + "loss": 0.9713, + "mean_token_accuracy": 0.7090980887413025, + "num_tokens": 221962548.0, + "step": 91100 + }, + { + "epoch": 0.8353351058952966, + "learning_rate": 3.2934812505730265e-05, + "loss": 1.0061, + "mean_token_accuracy": 0.7025028169155121, + "num_tokens": 221992851.0, + "step": 91110 + }, + { + "epoch": 0.8354267901347758, + "learning_rate": 3.2916475657834424e-05, + "loss": 0.9818, + "mean_token_accuracy": 0.7086591601371766, + "num_tokens": 222023824.0, + "step": 91120 + }, + { + "epoch": 0.8355184743742551, + "learning_rate": 3.289813880993857e-05, + "loss": 0.9995, + "mean_token_accuracy": 0.7047827005386352, + "num_tokens": 222054188.0, + "step": 91130 + }, + { + "epoch": 0.8356101586137343, + "learning_rate": 3.287980196204273e-05, + "loss": 0.9851, + "mean_token_accuracy": 0.701361620426178, + "num_tokens": 222081929.0, + "step": 91140 + }, + { + "epoch": 0.8357018428532136, + "learning_rate": 3.286146511414688e-05, + "loss": 0.9817, + "mean_token_accuracy": 0.7063040316104889, + "num_tokens": 222112090.0, + "step": 91150 + }, + { + "epoch": 0.8357935270926927, + "learning_rate": 3.284312826625103e-05, + "loss": 1.0185, + "mean_token_accuracy": 0.6978872060775757, + "num_tokens": 222143478.0, + "step": 91160 + }, + { + "epoch": 0.835885211332172, + "learning_rate": 3.282479141835519e-05, + "loss": 1.0516, + "mean_token_accuracy": 0.6882432162761688, + "num_tokens": 222174845.0, + "step": 91170 + }, + { + "epoch": 0.8359768955716512, + "learning_rate": 3.2806454570459335e-05, + "loss": 0.9762, + "mean_token_accuracy": 0.7065334260463715, + "num_tokens": 222205944.0, + "step": 91180 + }, + { + "epoch": 0.8360685798111305, + "learning_rate": 3.2788117722563494e-05, + "loss": 0.9541, + "mean_token_accuracy": 0.7162926018238067, + "num_tokens": 222236445.0, + "step": 91190 + }, + { + "epoch": 0.8361602640506097, + "learning_rate": 3.2769780874667646e-05, + "loss": 0.9723, + "mean_token_accuracy": 0.7066868841648102, + "num_tokens": 222265041.0, + "step": 91200 + }, + { + "epoch": 0.836251948290089, + "learning_rate": 3.27514440267718e-05, + "loss": 1.0265, + "mean_token_accuracy": 0.6991253197193146, + "num_tokens": 222296667.0, + "step": 91210 + }, + { + "epoch": 0.8363436325295681, + "learning_rate": 3.2733107178875956e-05, + "loss": 0.9812, + "mean_token_accuracy": 0.7063963234424591, + "num_tokens": 222327158.0, + "step": 91220 + }, + { + "epoch": 0.8364353167690474, + "learning_rate": 3.27147703309801e-05, + "loss": 1.0213, + "mean_token_accuracy": 0.6984895050525666, + "num_tokens": 222357989.0, + "step": 91230 + }, + { + "epoch": 0.8365270010085266, + "learning_rate": 3.269643348308426e-05, + "loss": 1.0321, + "mean_token_accuracy": 0.7004836976528168, + "num_tokens": 222388577.0, + "step": 91240 + }, + { + "epoch": 0.8366186852480059, + "learning_rate": 3.267809663518841e-05, + "loss": 0.9905, + "mean_token_accuracy": 0.7060478389263153, + "num_tokens": 222418326.0, + "step": 91250 + }, + { + "epoch": 0.8367103694874851, + "learning_rate": 3.2659759787292564e-05, + "loss": 0.9547, + "mean_token_accuracy": 0.7119473099708558, + "num_tokens": 222446805.0, + "step": 91260 + }, + { + "epoch": 0.8368020537269644, + "learning_rate": 3.264142293939672e-05, + "loss": 0.986, + "mean_token_accuracy": 0.7030215203762055, + "num_tokens": 222477988.0, + "step": 91270 + }, + { + "epoch": 0.8368937379664436, + "learning_rate": 3.262308609150087e-05, + "loss": 1.0069, + "mean_token_accuracy": 0.698031347990036, + "num_tokens": 222509889.0, + "step": 91280 + }, + { + "epoch": 0.8369854222059228, + "learning_rate": 3.2604749243605026e-05, + "loss": 0.9937, + "mean_token_accuracy": 0.699799257516861, + "num_tokens": 222541293.0, + "step": 91290 + }, + { + "epoch": 0.837077106445402, + "learning_rate": 3.2586412395709185e-05, + "loss": 1.0211, + "mean_token_accuracy": 0.6946413099765778, + "num_tokens": 222572968.0, + "step": 91300 + }, + { + "epoch": 0.8371687906848813, + "learning_rate": 3.256807554781333e-05, + "loss": 0.9897, + "mean_token_accuracy": 0.7046654760837555, + "num_tokens": 222604491.0, + "step": 91310 + }, + { + "epoch": 0.8372604749243605, + "learning_rate": 3.254973869991749e-05, + "loss": 0.9729, + "mean_token_accuracy": 0.7089137971401215, + "num_tokens": 222632305.0, + "step": 91320 + }, + { + "epoch": 0.8373521591638398, + "learning_rate": 3.2531401852021634e-05, + "loss": 1.0027, + "mean_token_accuracy": 0.7008799970149994, + "num_tokens": 222663773.0, + "step": 91330 + }, + { + "epoch": 0.837443843403319, + "learning_rate": 3.251306500412579e-05, + "loss": 0.9815, + "mean_token_accuracy": 0.7048599421977997, + "num_tokens": 222694460.0, + "step": 91340 + }, + { + "epoch": 0.8375355276427981, + "learning_rate": 3.249472815622995e-05, + "loss": 1.0105, + "mean_token_accuracy": 0.7016370117664337, + "num_tokens": 222725008.0, + "step": 91350 + }, + { + "epoch": 0.8376272118822774, + "learning_rate": 3.2476391308334096e-05, + "loss": 0.9618, + "mean_token_accuracy": 0.7082127451896667, + "num_tokens": 222755161.0, + "step": 91360 + }, + { + "epoch": 0.8377188961217567, + "learning_rate": 3.2458054460438255e-05, + "loss": 1.0034, + "mean_token_accuracy": 0.6991991460323334, + "num_tokens": 222786384.0, + "step": 91370 + }, + { + "epoch": 0.8378105803612359, + "learning_rate": 3.24397176125424e-05, + "loss": 0.9636, + "mean_token_accuracy": 0.7071750700473786, + "num_tokens": 222815206.0, + "step": 91380 + }, + { + "epoch": 0.8379022646007152, + "learning_rate": 3.242138076464656e-05, + "loss": 0.9969, + "mean_token_accuracy": 0.7010862648487091, + "num_tokens": 222846301.0, + "step": 91390 + }, + { + "epoch": 0.8379939488401944, + "learning_rate": 3.240304391675072e-05, + "loss": 1.0288, + "mean_token_accuracy": 0.7008266806602478, + "num_tokens": 222877510.0, + "step": 91400 + }, + { + "epoch": 0.8380856330796737, + "learning_rate": 3.238470706885486e-05, + "loss": 1.0092, + "mean_token_accuracy": 0.7055033504962921, + "num_tokens": 222909382.0, + "step": 91410 + }, + { + "epoch": 0.8381773173191528, + "learning_rate": 3.236637022095902e-05, + "loss": 0.9609, + "mean_token_accuracy": 0.7142740547657013, + "num_tokens": 222939790.0, + "step": 91420 + }, + { + "epoch": 0.838269001558632, + "learning_rate": 3.234803337306317e-05, + "loss": 0.9964, + "mean_token_accuracy": 0.7005717277526855, + "num_tokens": 222971254.0, + "step": 91430 + }, + { + "epoch": 0.8383606857981113, + "learning_rate": 3.2329696525167324e-05, + "loss": 1.0312, + "mean_token_accuracy": 0.6940638840198516, + "num_tokens": 223000601.0, + "step": 91440 + }, + { + "epoch": 0.8384523700375905, + "learning_rate": 3.231135967727148e-05, + "loss": 1.0222, + "mean_token_accuracy": 0.6965833485126496, + "num_tokens": 223031669.0, + "step": 91450 + }, + { + "epoch": 0.8385440542770698, + "learning_rate": 3.229302282937563e-05, + "loss": 1.0148, + "mean_token_accuracy": 0.6938436567783356, + "num_tokens": 223062222.0, + "step": 91460 + }, + { + "epoch": 0.838635738516549, + "learning_rate": 3.227468598147979e-05, + "loss": 1.0141, + "mean_token_accuracy": 0.6961119532585144, + "num_tokens": 223093582.0, + "step": 91470 + }, + { + "epoch": 0.8387274227560282, + "learning_rate": 3.225634913358394e-05, + "loss": 1.0159, + "mean_token_accuracy": 0.7005566835403443, + "num_tokens": 223124729.0, + "step": 91480 + }, + { + "epoch": 0.8388191069955074, + "learning_rate": 3.223801228568809e-05, + "loss": 0.9972, + "mean_token_accuracy": 0.7011977195739746, + "num_tokens": 223155276.0, + "step": 91490 + }, + { + "epoch": 0.8389107912349867, + "learning_rate": 3.221967543779225e-05, + "loss": 0.9902, + "mean_token_accuracy": 0.7020883321762085, + "num_tokens": 223183719.0, + "step": 91500 + }, + { + "epoch": 0.8390024754744659, + "learning_rate": 3.2201338589896394e-05, + "loss": 0.9973, + "mean_token_accuracy": 0.7041495442390442, + "num_tokens": 223214502.0, + "step": 91510 + }, + { + "epoch": 0.8390941597139452, + "learning_rate": 3.218300174200055e-05, + "loss": 1.0081, + "mean_token_accuracy": 0.6985054612159729, + "num_tokens": 223246196.0, + "step": 91520 + }, + { + "epoch": 0.8391858439534244, + "learning_rate": 3.2164664894104705e-05, + "loss": 0.9957, + "mean_token_accuracy": 0.7056102693080902, + "num_tokens": 223277272.0, + "step": 91530 + }, + { + "epoch": 0.8392775281929037, + "learning_rate": 3.214632804620886e-05, + "loss": 1.0193, + "mean_token_accuracy": 0.6959621608257294, + "num_tokens": 223307640.0, + "step": 91540 + }, + { + "epoch": 0.8393692124323828, + "learning_rate": 3.2127991198313015e-05, + "loss": 1.0015, + "mean_token_accuracy": 0.7042932510375977, + "num_tokens": 223337961.0, + "step": 91550 + }, + { + "epoch": 0.8394608966718621, + "learning_rate": 3.210965435041716e-05, + "loss": 0.9959, + "mean_token_accuracy": 0.7025859355926514, + "num_tokens": 223367569.0, + "step": 91560 + }, + { + "epoch": 0.8395525809113413, + "learning_rate": 3.209131750252132e-05, + "loss": 1.021, + "mean_token_accuracy": 0.6990630745887756, + "num_tokens": 223398545.0, + "step": 91570 + }, + { + "epoch": 0.8396442651508206, + "learning_rate": 3.207298065462547e-05, + "loss": 1.0004, + "mean_token_accuracy": 0.7005080997943878, + "num_tokens": 223428995.0, + "step": 91580 + }, + { + "epoch": 0.8397359493902998, + "learning_rate": 3.205464380672962e-05, + "loss": 1.0029, + "mean_token_accuracy": 0.7037331581115722, + "num_tokens": 223459170.0, + "step": 91590 + }, + { + "epoch": 0.8398276336297791, + "learning_rate": 3.203630695883378e-05, + "loss": 1.0277, + "mean_token_accuracy": 0.7013119220733642, + "num_tokens": 223489915.0, + "step": 91600 + }, + { + "epoch": 0.8399193178692582, + "learning_rate": 3.201797011093793e-05, + "loss": 0.9914, + "mean_token_accuracy": 0.7053504765033722, + "num_tokens": 223520451.0, + "step": 91610 + }, + { + "epoch": 0.8400110021087375, + "learning_rate": 3.1999633263042085e-05, + "loss": 0.9655, + "mean_token_accuracy": 0.7083058834075928, + "num_tokens": 223548955.0, + "step": 91620 + }, + { + "epoch": 0.8401026863482167, + "learning_rate": 3.198129641514624e-05, + "loss": 1.0169, + "mean_token_accuracy": 0.7000997841358185, + "num_tokens": 223580163.0, + "step": 91630 + }, + { + "epoch": 0.840194370587696, + "learning_rate": 3.196295956725039e-05, + "loss": 0.9834, + "mean_token_accuracy": 0.6998641967773438, + "num_tokens": 223611275.0, + "step": 91640 + }, + { + "epoch": 0.8402860548271752, + "learning_rate": 3.194462271935455e-05, + "loss": 0.9652, + "mean_token_accuracy": 0.7117608606815338, + "num_tokens": 223641395.0, + "step": 91650 + }, + { + "epoch": 0.8403777390666545, + "learning_rate": 3.19262858714587e-05, + "loss": 1.0022, + "mean_token_accuracy": 0.7010492026805878, + "num_tokens": 223671826.0, + "step": 91660 + }, + { + "epoch": 0.8404694233061337, + "learning_rate": 3.190794902356285e-05, + "loss": 0.9946, + "mean_token_accuracy": 0.7014322578907013, + "num_tokens": 223702931.0, + "step": 91670 + }, + { + "epoch": 0.8405611075456129, + "learning_rate": 3.1889612175667e-05, + "loss": 0.9705, + "mean_token_accuracy": 0.7093854248523712, + "num_tokens": 223731713.0, + "step": 91680 + }, + { + "epoch": 0.8406527917850921, + "learning_rate": 3.1871275327771155e-05, + "loss": 1.0141, + "mean_token_accuracy": 0.7003601014614105, + "num_tokens": 223763117.0, + "step": 91690 + }, + { + "epoch": 0.8407444760245714, + "learning_rate": 3.1852938479875314e-05, + "loss": 1.003, + "mean_token_accuracy": 0.7010448932647705, + "num_tokens": 223793505.0, + "step": 91700 + }, + { + "epoch": 0.8408361602640506, + "learning_rate": 3.1834601631979465e-05, + "loss": 1.0087, + "mean_token_accuracy": 0.7001794517040253, + "num_tokens": 223824394.0, + "step": 91710 + }, + { + "epoch": 0.8409278445035299, + "learning_rate": 3.181626478408362e-05, + "loss": 0.9893, + "mean_token_accuracy": 0.7095170080661773, + "num_tokens": 223856529.0, + "step": 91720 + }, + { + "epoch": 0.8410195287430091, + "learning_rate": 3.179792793618777e-05, + "loss": 1.0034, + "mean_token_accuracy": 0.7024901330471038, + "num_tokens": 223886958.0, + "step": 91730 + }, + { + "epoch": 0.8411112129824884, + "learning_rate": 3.177959108829193e-05, + "loss": 0.9706, + "mean_token_accuracy": 0.7048344671726227, + "num_tokens": 223914994.0, + "step": 91740 + }, + { + "epoch": 0.8412028972219675, + "learning_rate": 3.176125424039608e-05, + "loss": 1.0093, + "mean_token_accuracy": 0.7007959365844727, + "num_tokens": 223946012.0, + "step": 91750 + }, + { + "epoch": 0.8412945814614468, + "learning_rate": 3.174291739250023e-05, + "loss": 0.9975, + "mean_token_accuracy": 0.7080795049667359, + "num_tokens": 223976892.0, + "step": 91760 + }, + { + "epoch": 0.841386265700926, + "learning_rate": 3.1724580544604383e-05, + "loss": 1.0113, + "mean_token_accuracy": 0.7008758664131165, + "num_tokens": 224008730.0, + "step": 91770 + }, + { + "epoch": 0.8414779499404053, + "learning_rate": 3.1706243696708535e-05, + "loss": 1.0137, + "mean_token_accuracy": 0.6989102780818939, + "num_tokens": 224040108.0, + "step": 91780 + }, + { + "epoch": 0.8415696341798845, + "learning_rate": 3.1687906848812694e-05, + "loss": 1.0018, + "mean_token_accuracy": 0.7042802751064301, + "num_tokens": 224070662.0, + "step": 91790 + }, + { + "epoch": 0.8416613184193638, + "learning_rate": 3.1669570000916846e-05, + "loss": 0.9769, + "mean_token_accuracy": 0.7085938453674316, + "num_tokens": 224098487.0, + "step": 91800 + }, + { + "epoch": 0.8417530026588429, + "learning_rate": 3.1651233153021e-05, + "loss": 0.9952, + "mean_token_accuracy": 0.7060381650924683, + "num_tokens": 224128721.0, + "step": 91810 + }, + { + "epoch": 0.8418446868983221, + "learning_rate": 3.163289630512515e-05, + "loss": 0.9723, + "mean_token_accuracy": 0.7097331464290619, + "num_tokens": 224158648.0, + "step": 91820 + }, + { + "epoch": 0.8419363711378014, + "learning_rate": 3.16145594572293e-05, + "loss": 1.0277, + "mean_token_accuracy": 0.699338573217392, + "num_tokens": 224189975.0, + "step": 91830 + }, + { + "epoch": 0.8420280553772806, + "learning_rate": 3.159622260933346e-05, + "loss": 0.9778, + "mean_token_accuracy": 0.7073618948459626, + "num_tokens": 224220671.0, + "step": 91840 + }, + { + "epoch": 0.8421197396167599, + "learning_rate": 3.157788576143761e-05, + "loss": 0.9942, + "mean_token_accuracy": 0.7037886440753937, + "num_tokens": 224251242.0, + "step": 91850 + }, + { + "epoch": 0.8422114238562391, + "learning_rate": 3.1559548913541764e-05, + "loss": 0.9671, + "mean_token_accuracy": 0.7061097323894501, + "num_tokens": 224279067.0, + "step": 91860 + }, + { + "epoch": 0.8423031080957184, + "learning_rate": 3.1541212065645916e-05, + "loss": 1.021, + "mean_token_accuracy": 0.6982515513896942, + "num_tokens": 224310698.0, + "step": 91870 + }, + { + "epoch": 0.8423947923351975, + "learning_rate": 3.152287521775007e-05, + "loss": 1.0091, + "mean_token_accuracy": 0.7030785799026489, + "num_tokens": 224341772.0, + "step": 91880 + }, + { + "epoch": 0.8424864765746768, + "learning_rate": 3.1504538369854226e-05, + "loss": 1.0125, + "mean_token_accuracy": 0.6984831392765045, + "num_tokens": 224371944.0, + "step": 91890 + }, + { + "epoch": 0.842578160814156, + "learning_rate": 3.148620152195838e-05, + "loss": 0.9942, + "mean_token_accuracy": 0.7027344167232513, + "num_tokens": 224403172.0, + "step": 91900 + }, + { + "epoch": 0.8426698450536353, + "learning_rate": 3.146786467406253e-05, + "loss": 0.9834, + "mean_token_accuracy": 0.7057047128677368, + "num_tokens": 224432314.0, + "step": 91910 + }, + { + "epoch": 0.8427615292931145, + "learning_rate": 3.144952782616669e-05, + "loss": 0.987, + "mean_token_accuracy": 0.7073067247867584, + "num_tokens": 224461293.0, + "step": 91920 + }, + { + "epoch": 0.8428532135325938, + "learning_rate": 3.1431190978270834e-05, + "loss": 1.0092, + "mean_token_accuracy": 0.6986635565757752, + "num_tokens": 224491704.0, + "step": 91930 + }, + { + "epoch": 0.8429448977720729, + "learning_rate": 3.141285413037499e-05, + "loss": 0.9689, + "mean_token_accuracy": 0.7099559724330902, + "num_tokens": 224522159.0, + "step": 91940 + }, + { + "epoch": 0.8430365820115522, + "learning_rate": 3.1394517282479144e-05, + "loss": 1.0004, + "mean_token_accuracy": 0.7031835913658142, + "num_tokens": 224553742.0, + "step": 91950 + }, + { + "epoch": 0.8431282662510314, + "learning_rate": 3.1376180434583296e-05, + "loss": 0.9605, + "mean_token_accuracy": 0.7088021457195282, + "num_tokens": 224584837.0, + "step": 91960 + }, + { + "epoch": 0.8432199504905107, + "learning_rate": 3.1357843586687455e-05, + "loss": 0.9923, + "mean_token_accuracy": 0.7099215149879455, + "num_tokens": 224614366.0, + "step": 91970 + }, + { + "epoch": 0.8433116347299899, + "learning_rate": 3.13395067387916e-05, + "loss": 1.0107, + "mean_token_accuracy": 0.6980745732784271, + "num_tokens": 224643211.0, + "step": 91980 + }, + { + "epoch": 0.8434033189694692, + "learning_rate": 3.132116989089576e-05, + "loss": 1.0051, + "mean_token_accuracy": 0.7066904246807099, + "num_tokens": 224674876.0, + "step": 91990 + }, + { + "epoch": 0.8434950032089484, + "learning_rate": 3.130283304299991e-05, + "loss": 0.992, + "mean_token_accuracy": 0.7022707223892212, + "num_tokens": 224706286.0, + "step": 92000 + }, + { + "epoch": 0.8435866874484276, + "learning_rate": 3.128449619510406e-05, + "loss": 1.0358, + "mean_token_accuracy": 0.6943967401981354, + "num_tokens": 224735673.0, + "step": 92010 + }, + { + "epoch": 0.8436783716879068, + "learning_rate": 3.126615934720822e-05, + "loss": 0.984, + "mean_token_accuracy": 0.7018739461898804, + "num_tokens": 224766405.0, + "step": 92020 + }, + { + "epoch": 0.8437700559273861, + "learning_rate": 3.1247822499312366e-05, + "loss": 0.9948, + "mean_token_accuracy": 0.700128835439682, + "num_tokens": 224796389.0, + "step": 92030 + }, + { + "epoch": 0.8438617401668653, + "learning_rate": 3.1229485651416525e-05, + "loss": 1.0073, + "mean_token_accuracy": 0.7004628121852875, + "num_tokens": 224823526.0, + "step": 92040 + }, + { + "epoch": 0.8439534244063446, + "learning_rate": 3.1211148803520676e-05, + "loss": 1.0031, + "mean_token_accuracy": 0.6994020581245423, + "num_tokens": 224854352.0, + "step": 92050 + }, + { + "epoch": 0.8440451086458238, + "learning_rate": 3.119281195562483e-05, + "loss": 1.0303, + "mean_token_accuracy": 0.6925749242305755, + "num_tokens": 224884760.0, + "step": 92060 + }, + { + "epoch": 0.844136792885303, + "learning_rate": 3.117447510772899e-05, + "loss": 0.9964, + "mean_token_accuracy": 0.7054547429084778, + "num_tokens": 224915431.0, + "step": 92070 + }, + { + "epoch": 0.8442284771247822, + "learning_rate": 3.115613825983313e-05, + "loss": 0.9917, + "mean_token_accuracy": 0.7053548216819763, + "num_tokens": 224947166.0, + "step": 92080 + }, + { + "epoch": 0.8443201613642615, + "learning_rate": 3.113780141193729e-05, + "loss": 0.9829, + "mean_token_accuracy": 0.7075178861618042, + "num_tokens": 224977578.0, + "step": 92090 + }, + { + "epoch": 0.8444118456037407, + "learning_rate": 3.111946456404144e-05, + "loss": 0.9719, + "mean_token_accuracy": 0.7024227261543274, + "num_tokens": 225005512.0, + "step": 92100 + }, + { + "epoch": 0.84450352984322, + "learning_rate": 3.1101127716145594e-05, + "loss": 0.9747, + "mean_token_accuracy": 0.7060999393463134, + "num_tokens": 225036673.0, + "step": 92110 + }, + { + "epoch": 0.8445952140826992, + "learning_rate": 3.108279086824975e-05, + "loss": 1.0147, + "mean_token_accuracy": 0.6976794540882111, + "num_tokens": 225068821.0, + "step": 92120 + }, + { + "epoch": 0.8446868983221785, + "learning_rate": 3.10644540203539e-05, + "loss": 1.0105, + "mean_token_accuracy": 0.7012093305587769, + "num_tokens": 225099406.0, + "step": 92130 + }, + { + "epoch": 0.8447785825616576, + "learning_rate": 3.104611717245806e-05, + "loss": 1.0045, + "mean_token_accuracy": 0.7001675188541412, + "num_tokens": 225129722.0, + "step": 92140 + }, + { + "epoch": 0.8448702668011369, + "learning_rate": 3.102778032456221e-05, + "loss": 0.9859, + "mean_token_accuracy": 0.7040951013565063, + "num_tokens": 225160334.0, + "step": 92150 + }, + { + "epoch": 0.8449619510406161, + "learning_rate": 3.100944347666636e-05, + "loss": 0.9732, + "mean_token_accuracy": 0.7056873083114624, + "num_tokens": 225188221.0, + "step": 92160 + }, + { + "epoch": 0.8450536352800954, + "learning_rate": 3.099110662877052e-05, + "loss": 0.9988, + "mean_token_accuracy": 0.7046827554702759, + "num_tokens": 225218756.0, + "step": 92170 + }, + { + "epoch": 0.8451453195195746, + "learning_rate": 3.0972769780874664e-05, + "loss": 0.9929, + "mean_token_accuracy": 0.7025894045829773, + "num_tokens": 225248959.0, + "step": 92180 + }, + { + "epoch": 0.8452370037590539, + "learning_rate": 3.095443293297882e-05, + "loss": 1.0225, + "mean_token_accuracy": 0.6961394786834717, + "num_tokens": 225279958.0, + "step": 92190 + }, + { + "epoch": 0.845328687998533, + "learning_rate": 3.0936096085082975e-05, + "loss": 0.9839, + "mean_token_accuracy": 0.70698561668396, + "num_tokens": 225310359.0, + "step": 92200 + }, + { + "epoch": 0.8454203722380123, + "learning_rate": 3.0917759237187127e-05, + "loss": 1.0208, + "mean_token_accuracy": 0.696915727853775, + "num_tokens": 225341492.0, + "step": 92210 + }, + { + "epoch": 0.8455120564774915, + "learning_rate": 3.0899422389291285e-05, + "loss": 0.9691, + "mean_token_accuracy": 0.7075960218906403, + "num_tokens": 225369895.0, + "step": 92220 + }, + { + "epoch": 0.8456037407169708, + "learning_rate": 3.088108554139544e-05, + "loss": 1.0033, + "mean_token_accuracy": 0.7020844161510468, + "num_tokens": 225400552.0, + "step": 92230 + }, + { + "epoch": 0.84569542495645, + "learning_rate": 3.086274869349959e-05, + "loss": 0.9857, + "mean_token_accuracy": 0.7039596199989319, + "num_tokens": 225431494.0, + "step": 92240 + }, + { + "epoch": 0.8457871091959293, + "learning_rate": 3.084441184560374e-05, + "loss": 0.9952, + "mean_token_accuracy": 0.7030720889568329, + "num_tokens": 225462254.0, + "step": 92250 + }, + { + "epoch": 0.8458787934354085, + "learning_rate": 3.082607499770789e-05, + "loss": 1.0347, + "mean_token_accuracy": 0.6975192964076996, + "num_tokens": 225492772.0, + "step": 92260 + }, + { + "epoch": 0.8459704776748876, + "learning_rate": 3.080773814981205e-05, + "loss": 0.9845, + "mean_token_accuracy": 0.7059388339519501, + "num_tokens": 225522832.0, + "step": 92270 + }, + { + "epoch": 0.8460621619143669, + "learning_rate": 3.07894013019162e-05, + "loss": 0.9733, + "mean_token_accuracy": 0.7059954524040222, + "num_tokens": 225552321.0, + "step": 92280 + }, + { + "epoch": 0.8461538461538461, + "learning_rate": 3.0771064454020355e-05, + "loss": 1.0148, + "mean_token_accuracy": 0.6935909867286683, + "num_tokens": 225582357.0, + "step": 92290 + }, + { + "epoch": 0.8462455303933254, + "learning_rate": 3.075272760612451e-05, + "loss": 0.9941, + "mean_token_accuracy": 0.7026721596717834, + "num_tokens": 225613377.0, + "step": 92300 + }, + { + "epoch": 0.8463372146328046, + "learning_rate": 3.073439075822866e-05, + "loss": 1.0023, + "mean_token_accuracy": 0.703583025932312, + "num_tokens": 225643992.0, + "step": 92310 + }, + { + "epoch": 0.8464288988722839, + "learning_rate": 3.071605391033282e-05, + "loss": 0.9809, + "mean_token_accuracy": 0.70487340092659, + "num_tokens": 225674099.0, + "step": 92320 + }, + { + "epoch": 0.846520583111763, + "learning_rate": 3.069771706243697e-05, + "loss": 0.9966, + "mean_token_accuracy": 0.6940248966217041, + "num_tokens": 225704104.0, + "step": 92330 + }, + { + "epoch": 0.8466122673512423, + "learning_rate": 3.067938021454112e-05, + "loss": 0.9931, + "mean_token_accuracy": 0.7026736319065094, + "num_tokens": 225733018.0, + "step": 92340 + }, + { + "epoch": 0.8467039515907215, + "learning_rate": 3.066104336664527e-05, + "loss": 0.9937, + "mean_token_accuracy": 0.7105529487133027, + "num_tokens": 225763917.0, + "step": 92350 + }, + { + "epoch": 0.8467956358302008, + "learning_rate": 3.064270651874943e-05, + "loss": 0.999, + "mean_token_accuracy": 0.7028055250644684, + "num_tokens": 225795207.0, + "step": 92360 + }, + { + "epoch": 0.84688732006968, + "learning_rate": 3.0624369670853584e-05, + "loss": 1.003, + "mean_token_accuracy": 0.7021788954734802, + "num_tokens": 225825180.0, + "step": 92370 + }, + { + "epoch": 0.8469790043091593, + "learning_rate": 3.0606032822957735e-05, + "loss": 0.9792, + "mean_token_accuracy": 0.7024985313415527, + "num_tokens": 225855340.0, + "step": 92380 + }, + { + "epoch": 0.8470706885486385, + "learning_rate": 3.058769597506189e-05, + "loss": 1.0036, + "mean_token_accuracy": 0.7014451801776886, + "num_tokens": 225885618.0, + "step": 92390 + }, + { + "epoch": 0.8471623727881177, + "learning_rate": 3.056935912716604e-05, + "loss": 0.9674, + "mean_token_accuracy": 0.7104009866714478, + "num_tokens": 225914346.0, + "step": 92400 + }, + { + "epoch": 0.8472540570275969, + "learning_rate": 3.05510222792702e-05, + "loss": 0.9999, + "mean_token_accuracy": 0.7026920735836029, + "num_tokens": 225945234.0, + "step": 92410 + }, + { + "epoch": 0.8473457412670762, + "learning_rate": 3.053268543137435e-05, + "loss": 0.996, + "mean_token_accuracy": 0.7054856359958649, + "num_tokens": 225976466.0, + "step": 92420 + }, + { + "epoch": 0.8474374255065554, + "learning_rate": 3.05143485834785e-05, + "loss": 0.9868, + "mean_token_accuracy": 0.7047296702861786, + "num_tokens": 226007524.0, + "step": 92430 + }, + { + "epoch": 0.8475291097460347, + "learning_rate": 3.0496011735582653e-05, + "loss": 1.0165, + "mean_token_accuracy": 0.696868097782135, + "num_tokens": 226037824.0, + "step": 92440 + }, + { + "epoch": 0.8476207939855139, + "learning_rate": 3.047767488768681e-05, + "loss": 0.9866, + "mean_token_accuracy": 0.7058529853820801, + "num_tokens": 226067719.0, + "step": 92450 + }, + { + "epoch": 0.8477124782249931, + "learning_rate": 3.0459338039790964e-05, + "loss": 0.9797, + "mean_token_accuracy": 0.7003554463386535, + "num_tokens": 226096110.0, + "step": 92460 + }, + { + "epoch": 0.8478041624644723, + "learning_rate": 3.0441001191895112e-05, + "loss": 0.973, + "mean_token_accuracy": 0.7082064628601075, + "num_tokens": 226127058.0, + "step": 92470 + }, + { + "epoch": 0.8478958467039516, + "learning_rate": 3.0422664343999268e-05, + "loss": 1.0354, + "mean_token_accuracy": 0.6950591146945954, + "num_tokens": 226158699.0, + "step": 92480 + }, + { + "epoch": 0.8479875309434308, + "learning_rate": 3.040432749610342e-05, + "loss": 1.0177, + "mean_token_accuracy": 0.700346302986145, + "num_tokens": 226190250.0, + "step": 92490 + }, + { + "epoch": 0.8480792151829101, + "learning_rate": 3.0385990648207575e-05, + "loss": 0.9955, + "mean_token_accuracy": 0.7033508360385895, + "num_tokens": 226219946.0, + "step": 92500 + }, + { + "epoch": 0.8481708994223893, + "learning_rate": 3.036765380031173e-05, + "loss": 0.9986, + "mean_token_accuracy": 0.6954771339893341, + "num_tokens": 226250130.0, + "step": 92510 + }, + { + "epoch": 0.8482625836618686, + "learning_rate": 3.034931695241588e-05, + "loss": 0.9591, + "mean_token_accuracy": 0.7096432268619537, + "num_tokens": 226277856.0, + "step": 92520 + }, + { + "epoch": 0.8483542679013477, + "learning_rate": 3.0330980104520034e-05, + "loss": 0.9792, + "mean_token_accuracy": 0.7000100553035736, + "num_tokens": 226308809.0, + "step": 92530 + }, + { + "epoch": 0.848445952140827, + "learning_rate": 3.031264325662419e-05, + "loss": 0.9898, + "mean_token_accuracy": 0.7065817296504975, + "num_tokens": 226338960.0, + "step": 92540 + }, + { + "epoch": 0.8485376363803062, + "learning_rate": 3.029430640872834e-05, + "loss": 1.0085, + "mean_token_accuracy": 0.7020676970481873, + "num_tokens": 226369586.0, + "step": 92550 + }, + { + "epoch": 0.8486293206197855, + "learning_rate": 3.0275969560832496e-05, + "loss": 1.0288, + "mean_token_accuracy": 0.7000457465648651, + "num_tokens": 226400590.0, + "step": 92560 + }, + { + "epoch": 0.8487210048592647, + "learning_rate": 3.0257632712936645e-05, + "loss": 0.9855, + "mean_token_accuracy": 0.7003734707832336, + "num_tokens": 226429608.0, + "step": 92570 + }, + { + "epoch": 0.848812689098744, + "learning_rate": 3.02392958650408e-05, + "loss": 1.0009, + "mean_token_accuracy": 0.7032172381877899, + "num_tokens": 226458672.0, + "step": 92580 + }, + { + "epoch": 0.8489043733382231, + "learning_rate": 3.0220959017144955e-05, + "loss": 0.9864, + "mean_token_accuracy": 0.7043384611606598, + "num_tokens": 226490294.0, + "step": 92590 + }, + { + "epoch": 0.8489960575777024, + "learning_rate": 3.0202622169249107e-05, + "loss": 0.9927, + "mean_token_accuracy": 0.7044949352741241, + "num_tokens": 226521305.0, + "step": 92600 + }, + { + "epoch": 0.8490877418171816, + "learning_rate": 3.0184285321353262e-05, + "loss": 0.9948, + "mean_token_accuracy": 0.7017820060253144, + "num_tokens": 226551759.0, + "step": 92610 + }, + { + "epoch": 0.8491794260566609, + "learning_rate": 3.016594847345741e-05, + "loss": 0.9957, + "mean_token_accuracy": 0.70472252368927, + "num_tokens": 226582424.0, + "step": 92620 + }, + { + "epoch": 0.8492711102961401, + "learning_rate": 3.0147611625561566e-05, + "loss": 0.9818, + "mean_token_accuracy": 0.7079247176647187, + "num_tokens": 226611851.0, + "step": 92630 + }, + { + "epoch": 0.8493627945356194, + "learning_rate": 3.012927477766572e-05, + "loss": 1.0019, + "mean_token_accuracy": 0.6940906465053558, + "num_tokens": 226639158.0, + "step": 92640 + }, + { + "epoch": 0.8494544787750986, + "learning_rate": 3.0110937929769873e-05, + "loss": 0.9949, + "mean_token_accuracy": 0.7073172271251679, + "num_tokens": 226669578.0, + "step": 92650 + }, + { + "epoch": 0.8495461630145777, + "learning_rate": 3.009260108187403e-05, + "loss": 0.9883, + "mean_token_accuracy": 0.7053599774837493, + "num_tokens": 226700559.0, + "step": 92660 + }, + { + "epoch": 0.849637847254057, + "learning_rate": 3.0074264233978184e-05, + "loss": 1.0105, + "mean_token_accuracy": 0.7003489255905151, + "num_tokens": 226731054.0, + "step": 92670 + }, + { + "epoch": 0.8497295314935362, + "learning_rate": 3.0055927386082332e-05, + "loss": 1.0094, + "mean_token_accuracy": 0.7078044176101684, + "num_tokens": 226762562.0, + "step": 92680 + }, + { + "epoch": 0.8498212157330155, + "learning_rate": 3.0037590538186487e-05, + "loss": 0.9634, + "mean_token_accuracy": 0.7059079289436341, + "num_tokens": 226793398.0, + "step": 92690 + }, + { + "epoch": 0.8499128999724948, + "learning_rate": 3.001925369029064e-05, + "loss": 0.9902, + "mean_token_accuracy": 0.697595739364624, + "num_tokens": 226821303.0, + "step": 92700 + }, + { + "epoch": 0.850004584211974, + "learning_rate": 3.0000916842394795e-05, + "loss": 1.0235, + "mean_token_accuracy": 0.6974358201026917, + "num_tokens": 226852263.0, + "step": 92710 + }, + { + "epoch": 0.8500962684514531, + "learning_rate": 2.998257999449895e-05, + "loss": 0.9852, + "mean_token_accuracy": 0.7041719734668732, + "num_tokens": 226884205.0, + "step": 92720 + }, + { + "epoch": 0.8501879526909324, + "learning_rate": 2.9964243146603098e-05, + "loss": 0.9983, + "mean_token_accuracy": 0.7009266495704651, + "num_tokens": 226914671.0, + "step": 92730 + }, + { + "epoch": 0.8502796369304116, + "learning_rate": 2.9945906298707254e-05, + "loss": 0.9967, + "mean_token_accuracy": 0.70213183760643, + "num_tokens": 226946000.0, + "step": 92740 + }, + { + "epoch": 0.8503713211698909, + "learning_rate": 2.9927569450811405e-05, + "loss": 0.9985, + "mean_token_accuracy": 0.7022172152996063, + "num_tokens": 226977389.0, + "step": 92750 + }, + { + "epoch": 0.8504630054093701, + "learning_rate": 2.990923260291556e-05, + "loss": 0.9854, + "mean_token_accuracy": 0.701825100183487, + "num_tokens": 227005215.0, + "step": 92760 + }, + { + "epoch": 0.8505546896488494, + "learning_rate": 2.9890895755019716e-05, + "loss": 0.993, + "mean_token_accuracy": 0.7050695061683655, + "num_tokens": 227035909.0, + "step": 92770 + }, + { + "epoch": 0.8506463738883286, + "learning_rate": 2.9872558907123864e-05, + "loss": 1.024, + "mean_token_accuracy": 0.6951681792736053, + "num_tokens": 227066372.0, + "step": 92780 + }, + { + "epoch": 0.8507380581278078, + "learning_rate": 2.985422205922802e-05, + "loss": 0.9706, + "mean_token_accuracy": 0.7126036167144776, + "num_tokens": 227096199.0, + "step": 92790 + }, + { + "epoch": 0.850829742367287, + "learning_rate": 2.983588521133217e-05, + "loss": 0.988, + "mean_token_accuracy": 0.7058151662349701, + "num_tokens": 227126512.0, + "step": 92800 + }, + { + "epoch": 0.8509214266067663, + "learning_rate": 2.9817548363436327e-05, + "loss": 1.0053, + "mean_token_accuracy": 0.7011158227920532, + "num_tokens": 227157255.0, + "step": 92810 + }, + { + "epoch": 0.8510131108462455, + "learning_rate": 2.9799211515540482e-05, + "loss": 0.9595, + "mean_token_accuracy": 0.7099586308002472, + "num_tokens": 227185865.0, + "step": 92820 + }, + { + "epoch": 0.8511047950857248, + "learning_rate": 2.978087466764463e-05, + "loss": 1.0201, + "mean_token_accuracy": 0.694517332315445, + "num_tokens": 227216234.0, + "step": 92830 + }, + { + "epoch": 0.851196479325204, + "learning_rate": 2.9762537819748786e-05, + "loss": 1.0242, + "mean_token_accuracy": 0.6950756072998047, + "num_tokens": 227248508.0, + "step": 92840 + }, + { + "epoch": 0.8512881635646832, + "learning_rate": 2.974420097185294e-05, + "loss": 1.0285, + "mean_token_accuracy": 0.6953354895114898, + "num_tokens": 227279847.0, + "step": 92850 + }, + { + "epoch": 0.8513798478041624, + "learning_rate": 2.9725864123957093e-05, + "loss": 1.0041, + "mean_token_accuracy": 0.7030609607696533, + "num_tokens": 227309341.0, + "step": 92860 + }, + { + "epoch": 0.8514715320436417, + "learning_rate": 2.9707527276061248e-05, + "loss": 1.0174, + "mean_token_accuracy": 0.6984331011772156, + "num_tokens": 227339388.0, + "step": 92870 + }, + { + "epoch": 0.8515632162831209, + "learning_rate": 2.9689190428165397e-05, + "loss": 0.9989, + "mean_token_accuracy": 0.7009221613407135, + "num_tokens": 227367283.0, + "step": 92880 + }, + { + "epoch": 0.8516549005226002, + "learning_rate": 2.9670853580269552e-05, + "loss": 0.9628, + "mean_token_accuracy": 0.7050508320331573, + "num_tokens": 227396838.0, + "step": 92890 + }, + { + "epoch": 0.8517465847620794, + "learning_rate": 2.9652516732373707e-05, + "loss": 0.9862, + "mean_token_accuracy": 0.7043337821960449, + "num_tokens": 227427306.0, + "step": 92900 + }, + { + "epoch": 0.8518382690015587, + "learning_rate": 2.963417988447786e-05, + "loss": 1.0065, + "mean_token_accuracy": 0.6985112607479096, + "num_tokens": 227458049.0, + "step": 92910 + }, + { + "epoch": 0.8519299532410378, + "learning_rate": 2.9615843036582014e-05, + "loss": 0.9808, + "mean_token_accuracy": 0.7056490421295166, + "num_tokens": 227488684.0, + "step": 92920 + }, + { + "epoch": 0.8520216374805171, + "learning_rate": 2.9597506188686163e-05, + "loss": 0.9879, + "mean_token_accuracy": 0.6996640086174011, + "num_tokens": 227519462.0, + "step": 92930 + }, + { + "epoch": 0.8521133217199963, + "learning_rate": 2.9579169340790318e-05, + "loss": 0.9627, + "mean_token_accuracy": 0.7048620879650116, + "num_tokens": 227547906.0, + "step": 92940 + }, + { + "epoch": 0.8522050059594756, + "learning_rate": 2.9560832492894473e-05, + "loss": 0.9794, + "mean_token_accuracy": 0.7041147887706757, + "num_tokens": 227578381.0, + "step": 92950 + }, + { + "epoch": 0.8522966901989548, + "learning_rate": 2.9542495644998625e-05, + "loss": 1.0082, + "mean_token_accuracy": 0.6972006142139435, + "num_tokens": 227608937.0, + "step": 92960 + }, + { + "epoch": 0.8523883744384341, + "learning_rate": 2.952415879710278e-05, + "loss": 0.9965, + "mean_token_accuracy": 0.7008302807807922, + "num_tokens": 227637957.0, + "step": 92970 + }, + { + "epoch": 0.8524800586779133, + "learning_rate": 2.9505821949206936e-05, + "loss": 0.9912, + "mean_token_accuracy": 0.7032665610313416, + "num_tokens": 227668663.0, + "step": 92980 + }, + { + "epoch": 0.8525717429173925, + "learning_rate": 2.9487485101311084e-05, + "loss": 0.9642, + "mean_token_accuracy": 0.7147470891475678, + "num_tokens": 227699322.0, + "step": 92990 + }, + { + "epoch": 0.8526634271568717, + "learning_rate": 2.946914825341524e-05, + "loss": 0.9716, + "mean_token_accuracy": 0.7087487041950226, + "num_tokens": 227726986.0, + "step": 93000 + }, + { + "epoch": 0.852755111396351, + "learning_rate": 2.945081140551939e-05, + "loss": 0.9902, + "mean_token_accuracy": 0.7011621952056885, + "num_tokens": 227757175.0, + "step": 93010 + }, + { + "epoch": 0.8528467956358302, + "learning_rate": 2.9432474557623546e-05, + "loss": 0.9922, + "mean_token_accuracy": 0.7050215721130371, + "num_tokens": 227788463.0, + "step": 93020 + }, + { + "epoch": 0.8529384798753095, + "learning_rate": 2.9414137709727702e-05, + "loss": 1.0041, + "mean_token_accuracy": 0.7073045194149017, + "num_tokens": 227818333.0, + "step": 93030 + }, + { + "epoch": 0.8530301641147887, + "learning_rate": 2.939580086183185e-05, + "loss": 0.987, + "mean_token_accuracy": 0.7010485291481018, + "num_tokens": 227848632.0, + "step": 93040 + }, + { + "epoch": 0.8531218483542679, + "learning_rate": 2.9377464013936005e-05, + "loss": 0.9979, + "mean_token_accuracy": 0.7053632616996766, + "num_tokens": 227879608.0, + "step": 93050 + }, + { + "epoch": 0.8532135325937471, + "learning_rate": 2.9359127166040157e-05, + "loss": 0.9789, + "mean_token_accuracy": 0.7041413962841034, + "num_tokens": 227907252.0, + "step": 93060 + }, + { + "epoch": 0.8533052168332264, + "learning_rate": 2.9340790318144313e-05, + "loss": 0.9767, + "mean_token_accuracy": 0.7085775375366211, + "num_tokens": 227936995.0, + "step": 93070 + }, + { + "epoch": 0.8533969010727056, + "learning_rate": 2.9322453470248468e-05, + "loss": 0.9912, + "mean_token_accuracy": 0.7036928236484528, + "num_tokens": 227967171.0, + "step": 93080 + }, + { + "epoch": 0.8534885853121849, + "learning_rate": 2.9304116622352616e-05, + "loss": 1.0076, + "mean_token_accuracy": 0.7038045585155487, + "num_tokens": 227997434.0, + "step": 93090 + }, + { + "epoch": 0.8535802695516641, + "learning_rate": 2.928577977445677e-05, + "loss": 0.9962, + "mean_token_accuracy": 0.7029118537902832, + "num_tokens": 228028749.0, + "step": 93100 + }, + { + "epoch": 0.8536719537911434, + "learning_rate": 2.9267442926560923e-05, + "loss": 0.9875, + "mean_token_accuracy": 0.7051879584789276, + "num_tokens": 228059345.0, + "step": 93110 + }, + { + "epoch": 0.8537636380306225, + "learning_rate": 2.924910607866508e-05, + "loss": 0.9984, + "mean_token_accuracy": 0.6979428648948669, + "num_tokens": 228087885.0, + "step": 93120 + }, + { + "epoch": 0.8538553222701017, + "learning_rate": 2.9230769230769234e-05, + "loss": 0.9948, + "mean_token_accuracy": 0.6957296907901764, + "num_tokens": 228117280.0, + "step": 93130 + }, + { + "epoch": 0.853947006509581, + "learning_rate": 2.9212432382873382e-05, + "loss": 1.021, + "mean_token_accuracy": 0.6990654051303864, + "num_tokens": 228148102.0, + "step": 93140 + }, + { + "epoch": 0.8540386907490602, + "learning_rate": 2.9194095534977538e-05, + "loss": 1.0296, + "mean_token_accuracy": 0.6973524630069733, + "num_tokens": 228178163.0, + "step": 93150 + }, + { + "epoch": 0.8541303749885395, + "learning_rate": 2.9175758687081693e-05, + "loss": 1.0202, + "mean_token_accuracy": 0.6996358692646026, + "num_tokens": 228209516.0, + "step": 93160 + }, + { + "epoch": 0.8542220592280187, + "learning_rate": 2.9157421839185845e-05, + "loss": 1.0032, + "mean_token_accuracy": 0.7008218824863434, + "num_tokens": 228240313.0, + "step": 93170 + }, + { + "epoch": 0.8543137434674979, + "learning_rate": 2.913908499129e-05, + "loss": 0.9588, + "mean_token_accuracy": 0.7090696334838867, + "num_tokens": 228267800.0, + "step": 93180 + }, + { + "epoch": 0.8544054277069771, + "learning_rate": 2.912074814339415e-05, + "loss": 1.0105, + "mean_token_accuracy": 0.6994145393371582, + "num_tokens": 228297318.0, + "step": 93190 + }, + { + "epoch": 0.8544971119464564, + "learning_rate": 2.9102411295498304e-05, + "loss": 0.9708, + "mean_token_accuracy": 0.706597113609314, + "num_tokens": 228328054.0, + "step": 93200 + }, + { + "epoch": 0.8545887961859356, + "learning_rate": 2.908407444760246e-05, + "loss": 0.9846, + "mean_token_accuracy": 0.7094608187675476, + "num_tokens": 228358528.0, + "step": 93210 + }, + { + "epoch": 0.8546804804254149, + "learning_rate": 2.906573759970661e-05, + "loss": 0.9662, + "mean_token_accuracy": 0.7111461758613586, + "num_tokens": 228388798.0, + "step": 93220 + }, + { + "epoch": 0.8547721646648941, + "learning_rate": 2.9047400751810766e-05, + "loss": 0.9762, + "mean_token_accuracy": 0.7065777361392975, + "num_tokens": 228418669.0, + "step": 93230 + }, + { + "epoch": 0.8548638489043734, + "learning_rate": 2.9029063903914915e-05, + "loss": 0.9534, + "mean_token_accuracy": 0.707000195980072, + "num_tokens": 228446004.0, + "step": 93240 + }, + { + "epoch": 0.8549555331438525, + "learning_rate": 2.901072705601907e-05, + "loss": 1.0229, + "mean_token_accuracy": 0.6997511804103851, + "num_tokens": 228476661.0, + "step": 93250 + }, + { + "epoch": 0.8550472173833318, + "learning_rate": 2.8992390208123225e-05, + "loss": 0.9833, + "mean_token_accuracy": 0.7088791608810425, + "num_tokens": 228506208.0, + "step": 93260 + }, + { + "epoch": 0.855138901622811, + "learning_rate": 2.8974053360227377e-05, + "loss": 1.0133, + "mean_token_accuracy": 0.7014099001884461, + "num_tokens": 228537490.0, + "step": 93270 + }, + { + "epoch": 0.8552305858622903, + "learning_rate": 2.8955716512331532e-05, + "loss": 0.9899, + "mean_token_accuracy": 0.7015993654727936, + "num_tokens": 228568692.0, + "step": 93280 + }, + { + "epoch": 0.8553222701017695, + "learning_rate": 2.8937379664435688e-05, + "loss": 1.002, + "mean_token_accuracy": 0.7001181602478027, + "num_tokens": 228598813.0, + "step": 93290 + }, + { + "epoch": 0.8554139543412488, + "learning_rate": 2.8919042816539836e-05, + "loss": 0.9799, + "mean_token_accuracy": 0.7049507439136505, + "num_tokens": 228627304.0, + "step": 93300 + }, + { + "epoch": 0.8555056385807279, + "learning_rate": 2.890070596864399e-05, + "loss": 1.0223, + "mean_token_accuracy": 0.696961623430252, + "num_tokens": 228657602.0, + "step": 93310 + }, + { + "epoch": 0.8555973228202072, + "learning_rate": 2.8882369120748143e-05, + "loss": 1.0106, + "mean_token_accuracy": 0.701234781742096, + "num_tokens": 228689627.0, + "step": 93320 + }, + { + "epoch": 0.8556890070596864, + "learning_rate": 2.88640322728523e-05, + "loss": 0.9927, + "mean_token_accuracy": 0.7064007699489594, + "num_tokens": 228720524.0, + "step": 93330 + }, + { + "epoch": 0.8557806912991657, + "learning_rate": 2.8845695424956454e-05, + "loss": 0.9997, + "mean_token_accuracy": 0.7018190264701843, + "num_tokens": 228750989.0, + "step": 93340 + }, + { + "epoch": 0.8558723755386449, + "learning_rate": 2.8827358577060602e-05, + "loss": 1.0075, + "mean_token_accuracy": 0.7025477647781372, + "num_tokens": 228781701.0, + "step": 93350 + }, + { + "epoch": 0.8559640597781242, + "learning_rate": 2.8809021729164757e-05, + "loss": 0.9801, + "mean_token_accuracy": 0.7058349132537842, + "num_tokens": 228811126.0, + "step": 93360 + }, + { + "epoch": 0.8560557440176034, + "learning_rate": 2.879068488126891e-05, + "loss": 0.9824, + "mean_token_accuracy": 0.7093196511268616, + "num_tokens": 228841124.0, + "step": 93370 + }, + { + "epoch": 0.8561474282570826, + "learning_rate": 2.8772348033373065e-05, + "loss": 1.0145, + "mean_token_accuracy": 0.6966848611831665, + "num_tokens": 228872263.0, + "step": 93380 + }, + { + "epoch": 0.8562391124965618, + "learning_rate": 2.875401118547722e-05, + "loss": 0.9932, + "mean_token_accuracy": 0.7081319630146027, + "num_tokens": 228902807.0, + "step": 93390 + }, + { + "epoch": 0.8563307967360411, + "learning_rate": 2.8735674337581368e-05, + "loss": 1.0117, + "mean_token_accuracy": 0.698861300945282, + "num_tokens": 228933482.0, + "step": 93400 + }, + { + "epoch": 0.8564224809755203, + "learning_rate": 2.8717337489685524e-05, + "loss": 0.9978, + "mean_token_accuracy": 0.704002457857132, + "num_tokens": 228963433.0, + "step": 93410 + }, + { + "epoch": 0.8565141652149996, + "learning_rate": 2.8699000641789675e-05, + "loss": 0.9639, + "mean_token_accuracy": 0.7072536885738373, + "num_tokens": 228991320.0, + "step": 93420 + }, + { + "epoch": 0.8566058494544788, + "learning_rate": 2.868066379389383e-05, + "loss": 0.9952, + "mean_token_accuracy": 0.7035923779010773, + "num_tokens": 229022233.0, + "step": 93430 + }, + { + "epoch": 0.856697533693958, + "learning_rate": 2.8662326945997986e-05, + "loss": 0.9896, + "mean_token_accuracy": 0.7070930659770965, + "num_tokens": 229053338.0, + "step": 93440 + }, + { + "epoch": 0.8567892179334372, + "learning_rate": 2.8643990098102134e-05, + "loss": 0.986, + "mean_token_accuracy": 0.7019206285476685, + "num_tokens": 229084415.0, + "step": 93450 + }, + { + "epoch": 0.8568809021729165, + "learning_rate": 2.862565325020629e-05, + "loss": 0.9855, + "mean_token_accuracy": 0.7055654048919677, + "num_tokens": 229114439.0, + "step": 93460 + }, + { + "epoch": 0.8569725864123957, + "learning_rate": 2.8607316402310448e-05, + "loss": 0.9565, + "mean_token_accuracy": 0.7126664459705353, + "num_tokens": 229145282.0, + "step": 93470 + }, + { + "epoch": 0.857064270651875, + "learning_rate": 2.8588979554414597e-05, + "loss": 0.9589, + "mean_token_accuracy": 0.7095115303993225, + "num_tokens": 229174284.0, + "step": 93480 + }, + { + "epoch": 0.8571559548913542, + "learning_rate": 2.8570642706518752e-05, + "loss": 0.9664, + "mean_token_accuracy": 0.7075452685356141, + "num_tokens": 229205198.0, + "step": 93490 + }, + { + "epoch": 0.8572476391308335, + "learning_rate": 2.85523058586229e-05, + "loss": 1.0149, + "mean_token_accuracy": 0.6994210004806518, + "num_tokens": 229235339.0, + "step": 93500 + }, + { + "epoch": 0.8573393233703126, + "learning_rate": 2.8533969010727056e-05, + "loss": 0.9983, + "mean_token_accuracy": 0.7030344009399414, + "num_tokens": 229265819.0, + "step": 93510 + }, + { + "epoch": 0.8574310076097919, + "learning_rate": 2.8515632162831214e-05, + "loss": 0.9721, + "mean_token_accuracy": 0.7081470489501953, + "num_tokens": 229296826.0, + "step": 93520 + }, + { + "epoch": 0.8575226918492711, + "learning_rate": 2.8497295314935363e-05, + "loss": 0.9868, + "mean_token_accuracy": 0.7028627216815948, + "num_tokens": 229327198.0, + "step": 93530 + }, + { + "epoch": 0.8576143760887504, + "learning_rate": 2.8478958467039518e-05, + "loss": 0.9595, + "mean_token_accuracy": 0.7105356931686402, + "num_tokens": 229355379.0, + "step": 93540 + }, + { + "epoch": 0.8577060603282296, + "learning_rate": 2.8460621619143667e-05, + "loss": 1.0173, + "mean_token_accuracy": 0.7038970828056336, + "num_tokens": 229386855.0, + "step": 93550 + }, + { + "epoch": 0.8577977445677089, + "learning_rate": 2.8442284771247822e-05, + "loss": 0.97, + "mean_token_accuracy": 0.7084010183811188, + "num_tokens": 229417133.0, + "step": 93560 + }, + { + "epoch": 0.857889428807188, + "learning_rate": 2.842394792335198e-05, + "loss": 1.0135, + "mean_token_accuracy": 0.6986473262310028, + "num_tokens": 229448517.0, + "step": 93570 + }, + { + "epoch": 0.8579811130466672, + "learning_rate": 2.840561107545613e-05, + "loss": 0.9992, + "mean_token_accuracy": 0.6998164474964141, + "num_tokens": 229479214.0, + "step": 93580 + }, + { + "epoch": 0.8580727972861465, + "learning_rate": 2.8387274227560284e-05, + "loss": 0.9878, + "mean_token_accuracy": 0.7021778881549835, + "num_tokens": 229509169.0, + "step": 93590 + }, + { + "epoch": 0.8581644815256257, + "learning_rate": 2.836893737966444e-05, + "loss": 0.9576, + "mean_token_accuracy": 0.7058420538902282, + "num_tokens": 229537172.0, + "step": 93600 + }, + { + "epoch": 0.858256165765105, + "learning_rate": 2.835060053176859e-05, + "loss": 0.9875, + "mean_token_accuracy": 0.7006553530693054, + "num_tokens": 229567771.0, + "step": 93610 + }, + { + "epoch": 0.8583478500045842, + "learning_rate": 2.8332263683872747e-05, + "loss": 1.0289, + "mean_token_accuracy": 0.6926831424236297, + "num_tokens": 229598995.0, + "step": 93620 + }, + { + "epoch": 0.8584395342440635, + "learning_rate": 2.8313926835976895e-05, + "loss": 1.0102, + "mean_token_accuracy": 0.6992372453212738, + "num_tokens": 229629697.0, + "step": 93630 + }, + { + "epoch": 0.8585312184835426, + "learning_rate": 2.829558998808105e-05, + "loss": 1.0076, + "mean_token_accuracy": 0.7017565727233886, + "num_tokens": 229659414.0, + "step": 93640 + }, + { + "epoch": 0.8586229027230219, + "learning_rate": 2.8277253140185206e-05, + "loss": 1.0009, + "mean_token_accuracy": 0.7049071252346039, + "num_tokens": 229690851.0, + "step": 93650 + }, + { + "epoch": 0.8587145869625011, + "learning_rate": 2.8258916292289357e-05, + "loss": 0.9649, + "mean_token_accuracy": 0.7046798527240753, + "num_tokens": 229717969.0, + "step": 93660 + }, + { + "epoch": 0.8588062712019804, + "learning_rate": 2.8240579444393513e-05, + "loss": 1.0143, + "mean_token_accuracy": 0.699289733171463, + "num_tokens": 229749126.0, + "step": 93670 + }, + { + "epoch": 0.8588979554414596, + "learning_rate": 2.822224259649766e-05, + "loss": 1.0323, + "mean_token_accuracy": 0.6974205195903778, + "num_tokens": 229779925.0, + "step": 93680 + }, + { + "epoch": 0.8589896396809389, + "learning_rate": 2.8203905748601816e-05, + "loss": 0.9913, + "mean_token_accuracy": 0.7032601416110993, + "num_tokens": 229811482.0, + "step": 93690 + }, + { + "epoch": 0.859081323920418, + "learning_rate": 2.8185568900705972e-05, + "loss": 0.9861, + "mean_token_accuracy": 0.7054169058799744, + "num_tokens": 229842304.0, + "step": 93700 + }, + { + "epoch": 0.8591730081598973, + "learning_rate": 2.8167232052810124e-05, + "loss": 1.0035, + "mean_token_accuracy": 0.7035200297832489, + "num_tokens": 229872102.0, + "step": 93710 + }, + { + "epoch": 0.8592646923993765, + "learning_rate": 2.814889520491428e-05, + "loss": 0.9992, + "mean_token_accuracy": 0.7006593167781829, + "num_tokens": 229900293.0, + "step": 93720 + }, + { + "epoch": 0.8593563766388558, + "learning_rate": 2.8130558357018427e-05, + "loss": 0.9557, + "mean_token_accuracy": 0.710857379436493, + "num_tokens": 229931341.0, + "step": 93730 + }, + { + "epoch": 0.859448060878335, + "learning_rate": 2.8112221509122583e-05, + "loss": 0.9887, + "mean_token_accuracy": 0.7041126251220703, + "num_tokens": 229961720.0, + "step": 93740 + }, + { + "epoch": 0.8595397451178143, + "learning_rate": 2.8093884661226738e-05, + "loss": 0.9628, + "mean_token_accuracy": 0.707321721315384, + "num_tokens": 229991875.0, + "step": 93750 + }, + { + "epoch": 0.8596314293572935, + "learning_rate": 2.807554781333089e-05, + "loss": 1.0085, + "mean_token_accuracy": 0.6946305811405182, + "num_tokens": 230022718.0, + "step": 93760 + }, + { + "epoch": 0.8597231135967727, + "learning_rate": 2.8057210965435045e-05, + "loss": 1.0083, + "mean_token_accuracy": 0.7017239272594452, + "num_tokens": 230052335.0, + "step": 93770 + }, + { + "epoch": 0.8598147978362519, + "learning_rate": 2.80388741175392e-05, + "loss": 1.0019, + "mean_token_accuracy": 0.6990306317806244, + "num_tokens": 230080329.0, + "step": 93780 + }, + { + "epoch": 0.8599064820757312, + "learning_rate": 2.802053726964335e-05, + "loss": 0.9721, + "mean_token_accuracy": 0.7119702637195587, + "num_tokens": 230109908.0, + "step": 93790 + }, + { + "epoch": 0.8599981663152104, + "learning_rate": 2.8002200421747504e-05, + "loss": 0.9931, + "mean_token_accuracy": 0.7025001227855683, + "num_tokens": 230140443.0, + "step": 93800 + }, + { + "epoch": 0.8600898505546897, + "learning_rate": 2.7983863573851656e-05, + "loss": 1.0093, + "mean_token_accuracy": 0.7040551781654358, + "num_tokens": 230170316.0, + "step": 93810 + }, + { + "epoch": 0.8601815347941689, + "learning_rate": 2.796552672595581e-05, + "loss": 0.9965, + "mean_token_accuracy": 0.7011925458908081, + "num_tokens": 230200380.0, + "step": 93820 + }, + { + "epoch": 0.8602732190336481, + "learning_rate": 2.7947189878059966e-05, + "loss": 0.992, + "mean_token_accuracy": 0.7017391383647918, + "num_tokens": 230230488.0, + "step": 93830 + }, + { + "epoch": 0.8603649032731273, + "learning_rate": 2.7928853030164115e-05, + "loss": 0.978, + "mean_token_accuracy": 0.7033119022846221, + "num_tokens": 230258354.0, + "step": 93840 + }, + { + "epoch": 0.8604565875126066, + "learning_rate": 2.791051618226827e-05, + "loss": 0.9922, + "mean_token_accuracy": 0.7034036040306091, + "num_tokens": 230288543.0, + "step": 93850 + }, + { + "epoch": 0.8605482717520858, + "learning_rate": 2.7892179334372422e-05, + "loss": 0.9878, + "mean_token_accuracy": 0.7018364071846008, + "num_tokens": 230319075.0, + "step": 93860 + }, + { + "epoch": 0.8606399559915651, + "learning_rate": 2.7873842486476577e-05, + "loss": 0.9814, + "mean_token_accuracy": 0.7068473875522614, + "num_tokens": 230349285.0, + "step": 93870 + }, + { + "epoch": 0.8607316402310443, + "learning_rate": 2.7855505638580732e-05, + "loss": 1.0028, + "mean_token_accuracy": 0.6989137411117554, + "num_tokens": 230379656.0, + "step": 93880 + }, + { + "epoch": 0.8608233244705236, + "learning_rate": 2.783716879068488e-05, + "loss": 0.9928, + "mean_token_accuracy": 0.698908656835556, + "num_tokens": 230410080.0, + "step": 93890 + }, + { + "epoch": 0.8609150087100027, + "learning_rate": 2.7818831942789036e-05, + "loss": 0.9962, + "mean_token_accuracy": 0.7035494387149811, + "num_tokens": 230438196.0, + "step": 93900 + }, + { + "epoch": 0.861006692949482, + "learning_rate": 2.780049509489319e-05, + "loss": 1.0011, + "mean_token_accuracy": 0.7058464050292969, + "num_tokens": 230468924.0, + "step": 93910 + }, + { + "epoch": 0.8610983771889612, + "learning_rate": 2.7782158246997343e-05, + "loss": 0.998, + "mean_token_accuracy": 0.702565610408783, + "num_tokens": 230499205.0, + "step": 93920 + }, + { + "epoch": 0.8611900614284405, + "learning_rate": 2.77638213991015e-05, + "loss": 0.973, + "mean_token_accuracy": 0.706601870059967, + "num_tokens": 230528770.0, + "step": 93930 + }, + { + "epoch": 0.8612817456679197, + "learning_rate": 2.7745484551205647e-05, + "loss": 1.0087, + "mean_token_accuracy": 0.6979085981845856, + "num_tokens": 230559888.0, + "step": 93940 + }, + { + "epoch": 0.861373429907399, + "learning_rate": 2.7727147703309802e-05, + "loss": 1.0179, + "mean_token_accuracy": 0.6932749927043915, + "num_tokens": 230589187.0, + "step": 93950 + }, + { + "epoch": 0.8614651141468781, + "learning_rate": 2.7708810855413958e-05, + "loss": 0.9798, + "mean_token_accuracy": 0.7050952792167664, + "num_tokens": 230616591.0, + "step": 93960 + }, + { + "epoch": 0.8615567983863573, + "learning_rate": 2.769047400751811e-05, + "loss": 0.967, + "mean_token_accuracy": 0.7060283780097961, + "num_tokens": 230646084.0, + "step": 93970 + }, + { + "epoch": 0.8616484826258366, + "learning_rate": 2.7672137159622265e-05, + "loss": 0.969, + "mean_token_accuracy": 0.7095028698444367, + "num_tokens": 230674694.0, + "step": 93980 + }, + { + "epoch": 0.8617401668653158, + "learning_rate": 2.7653800311726413e-05, + "loss": 0.9702, + "mean_token_accuracy": 0.705646425485611, + "num_tokens": 230705039.0, + "step": 93990 + }, + { + "epoch": 0.8618318511047951, + "learning_rate": 2.763546346383057e-05, + "loss": 1.002, + "mean_token_accuracy": 0.7054389953613281, + "num_tokens": 230735426.0, + "step": 94000 + }, + { + "epoch": 0.8619235353442743, + "learning_rate": 2.7617126615934724e-05, + "loss": 1.0114, + "mean_token_accuracy": 0.6922630369663239, + "num_tokens": 230764606.0, + "step": 94010 + }, + { + "epoch": 0.8620152195837536, + "learning_rate": 2.7598789768038876e-05, + "loss": 0.954, + "mean_token_accuracy": 0.7118881821632386, + "num_tokens": 230792909.0, + "step": 94020 + }, + { + "epoch": 0.8621069038232327, + "learning_rate": 2.758045292014303e-05, + "loss": 0.9866, + "mean_token_accuracy": 0.7054672062397003, + "num_tokens": 230822743.0, + "step": 94030 + }, + { + "epoch": 0.862198588062712, + "learning_rate": 2.756211607224718e-05, + "loss": 0.9656, + "mean_token_accuracy": 0.7076707184314728, + "num_tokens": 230852177.0, + "step": 94040 + }, + { + "epoch": 0.8622902723021912, + "learning_rate": 2.7543779224351334e-05, + "loss": 0.9814, + "mean_token_accuracy": 0.7012471199035645, + "num_tokens": 230881719.0, + "step": 94050 + }, + { + "epoch": 0.8623819565416705, + "learning_rate": 2.752544237645549e-05, + "loss": 1.0074, + "mean_token_accuracy": 0.7048568487167358, + "num_tokens": 230912558.0, + "step": 94060 + }, + { + "epoch": 0.8624736407811497, + "learning_rate": 2.750710552855964e-05, + "loss": 1.0192, + "mean_token_accuracy": 0.6959864974021912, + "num_tokens": 230942152.0, + "step": 94070 + }, + { + "epoch": 0.862565325020629, + "learning_rate": 2.7488768680663797e-05, + "loss": 1.0034, + "mean_token_accuracy": 0.6967722237110138, + "num_tokens": 230970808.0, + "step": 94080 + }, + { + "epoch": 0.8626570092601082, + "learning_rate": 2.7470431832767952e-05, + "loss": 0.9748, + "mean_token_accuracy": 0.707591074705124, + "num_tokens": 231000175.0, + "step": 94090 + }, + { + "epoch": 0.8627486934995874, + "learning_rate": 2.74520949848721e-05, + "loss": 0.9897, + "mean_token_accuracy": 0.7098795533180237, + "num_tokens": 231029227.0, + "step": 94100 + }, + { + "epoch": 0.8628403777390666, + "learning_rate": 2.7433758136976256e-05, + "loss": 1.006, + "mean_token_accuracy": 0.7012426614761352, + "num_tokens": 231059404.0, + "step": 94110 + }, + { + "epoch": 0.8629320619785459, + "learning_rate": 2.7415421289080408e-05, + "loss": 1.0141, + "mean_token_accuracy": 0.6978681802749633, + "num_tokens": 231089996.0, + "step": 94120 + }, + { + "epoch": 0.8630237462180251, + "learning_rate": 2.7397084441184563e-05, + "loss": 0.9544, + "mean_token_accuracy": 0.7131826937198639, + "num_tokens": 231119730.0, + "step": 94130 + }, + { + "epoch": 0.8631154304575044, + "learning_rate": 2.7378747593288718e-05, + "loss": 0.984, + "mean_token_accuracy": 0.7006629467010498, + "num_tokens": 231146825.0, + "step": 94140 + }, + { + "epoch": 0.8632071146969836, + "learning_rate": 2.7360410745392867e-05, + "loss": 0.9961, + "mean_token_accuracy": 0.6985842466354371, + "num_tokens": 231177431.0, + "step": 94150 + }, + { + "epoch": 0.8632987989364628, + "learning_rate": 2.7342073897497022e-05, + "loss": 1.0247, + "mean_token_accuracy": 0.6996906638145447, + "num_tokens": 231207506.0, + "step": 94160 + }, + { + "epoch": 0.863390483175942, + "learning_rate": 2.7323737049601174e-05, + "loss": 0.9896, + "mean_token_accuracy": 0.7020743370056153, + "num_tokens": 231236608.0, + "step": 94170 + }, + { + "epoch": 0.8634821674154213, + "learning_rate": 2.730540020170533e-05, + "loss": 1.0192, + "mean_token_accuracy": 0.699338161945343, + "num_tokens": 231266722.0, + "step": 94180 + }, + { + "epoch": 0.8635738516549005, + "learning_rate": 2.7287063353809484e-05, + "loss": 0.9814, + "mean_token_accuracy": 0.6987640619277954, + "num_tokens": 231296180.0, + "step": 94190 + }, + { + "epoch": 0.8636655358943798, + "learning_rate": 2.7268726505913633e-05, + "loss": 0.9644, + "mean_token_accuracy": 0.710695606470108, + "num_tokens": 231324156.0, + "step": 94200 + }, + { + "epoch": 0.863757220133859, + "learning_rate": 2.7250389658017788e-05, + "loss": 0.977, + "mean_token_accuracy": 0.7077572464942932, + "num_tokens": 231355039.0, + "step": 94210 + }, + { + "epoch": 0.8638489043733383, + "learning_rate": 2.7232052810121943e-05, + "loss": 0.9703, + "mean_token_accuracy": 0.7070972979068756, + "num_tokens": 231384375.0, + "step": 94220 + }, + { + "epoch": 0.8639405886128174, + "learning_rate": 2.7213715962226095e-05, + "loss": 0.9995, + "mean_token_accuracy": 0.7043955206871033, + "num_tokens": 231413825.0, + "step": 94230 + }, + { + "epoch": 0.8640322728522967, + "learning_rate": 2.719537911433025e-05, + "loss": 0.9708, + "mean_token_accuracy": 0.7065513074398041, + "num_tokens": 231443164.0, + "step": 94240 + }, + { + "epoch": 0.8641239570917759, + "learning_rate": 2.71770422664344e-05, + "loss": 1.0008, + "mean_token_accuracy": 0.7002853393554688, + "num_tokens": 231473461.0, + "step": 94250 + }, + { + "epoch": 0.8642156413312552, + "learning_rate": 2.7158705418538554e-05, + "loss": 0.9558, + "mean_token_accuracy": 0.7069169521331787, + "num_tokens": 231501040.0, + "step": 94260 + }, + { + "epoch": 0.8643073255707344, + "learning_rate": 2.714036857064271e-05, + "loss": 0.9944, + "mean_token_accuracy": 0.7037984371185303, + "num_tokens": 231531327.0, + "step": 94270 + }, + { + "epoch": 0.8643990098102137, + "learning_rate": 2.712203172274686e-05, + "loss": 1.0082, + "mean_token_accuracy": 0.7028061032295227, + "num_tokens": 231560377.0, + "step": 94280 + }, + { + "epoch": 0.8644906940496928, + "learning_rate": 2.7103694874851017e-05, + "loss": 0.9888, + "mean_token_accuracy": 0.7046666860580444, + "num_tokens": 231589614.0, + "step": 94290 + }, + { + "epoch": 0.8645823782891721, + "learning_rate": 2.7085358026955165e-05, + "loss": 0.9998, + "mean_token_accuracy": 0.700808972120285, + "num_tokens": 231618458.0, + "step": 94300 + }, + { + "epoch": 0.8646740625286513, + "learning_rate": 2.706702117905932e-05, + "loss": 0.99, + "mean_token_accuracy": 0.7057264983654022, + "num_tokens": 231649163.0, + "step": 94310 + }, + { + "epoch": 0.8647657467681306, + "learning_rate": 2.7048684331163476e-05, + "loss": 0.9561, + "mean_token_accuracy": 0.7108542919158936, + "num_tokens": 231676889.0, + "step": 94320 + }, + { + "epoch": 0.8648574310076098, + "learning_rate": 2.7030347483267627e-05, + "loss": 1.0102, + "mean_token_accuracy": 0.6991156876087189, + "num_tokens": 231706959.0, + "step": 94330 + }, + { + "epoch": 0.8649491152470891, + "learning_rate": 2.7012010635371783e-05, + "loss": 0.9949, + "mean_token_accuracy": 0.7035431027412414, + "num_tokens": 231736139.0, + "step": 94340 + }, + { + "epoch": 0.8650407994865683, + "learning_rate": 2.699367378747593e-05, + "loss": 0.966, + "mean_token_accuracy": 0.7110806465148926, + "num_tokens": 231765629.0, + "step": 94350 + }, + { + "epoch": 0.8651324837260475, + "learning_rate": 2.6975336939580086e-05, + "loss": 0.99, + "mean_token_accuracy": 0.7026050984859467, + "num_tokens": 231795445.0, + "step": 94360 + }, + { + "epoch": 0.8652241679655267, + "learning_rate": 2.695700009168424e-05, + "loss": 0.9915, + "mean_token_accuracy": 0.7057330727577209, + "num_tokens": 231824756.0, + "step": 94370 + }, + { + "epoch": 0.865315852205006, + "learning_rate": 2.6938663243788394e-05, + "loss": 0.9787, + "mean_token_accuracy": 0.7037960708141326, + "num_tokens": 231852294.0, + "step": 94380 + }, + { + "epoch": 0.8654075364444852, + "learning_rate": 2.692032639589255e-05, + "loss": 0.9734, + "mean_token_accuracy": 0.7058798670768738, + "num_tokens": 231881665.0, + "step": 94390 + }, + { + "epoch": 0.8654992206839645, + "learning_rate": 2.6901989547996704e-05, + "loss": 1.0152, + "mean_token_accuracy": 0.6974703252315522, + "num_tokens": 231911070.0, + "step": 94400 + }, + { + "epoch": 0.8655909049234437, + "learning_rate": 2.6883652700100853e-05, + "loss": 0.984, + "mean_token_accuracy": 0.7004394233226776, + "num_tokens": 231940680.0, + "step": 94410 + }, + { + "epoch": 0.8656825891629228, + "learning_rate": 2.6865315852205008e-05, + "loss": 0.9946, + "mean_token_accuracy": 0.7020886182785034, + "num_tokens": 231969937.0, + "step": 94420 + }, + { + "epoch": 0.8657742734024021, + "learning_rate": 2.684697900430916e-05, + "loss": 1.0296, + "mean_token_accuracy": 0.694058620929718, + "num_tokens": 231998670.0, + "step": 94430 + }, + { + "epoch": 0.8658659576418813, + "learning_rate": 2.6828642156413315e-05, + "loss": 1.0034, + "mean_token_accuracy": 0.6922867357730865, + "num_tokens": 232026165.0, + "step": 94440 + }, + { + "epoch": 0.8659576418813606, + "learning_rate": 2.681030530851747e-05, + "loss": 1.0265, + "mean_token_accuracy": 0.6965956032276154, + "num_tokens": 232056410.0, + "step": 94450 + }, + { + "epoch": 0.8660493261208398, + "learning_rate": 2.679196846062162e-05, + "loss": 0.999, + "mean_token_accuracy": 0.7027850270271301, + "num_tokens": 232086808.0, + "step": 94460 + }, + { + "epoch": 0.8661410103603191, + "learning_rate": 2.6773631612725774e-05, + "loss": 0.978, + "mean_token_accuracy": 0.7054557502269745, + "num_tokens": 232115545.0, + "step": 94470 + }, + { + "epoch": 0.8662326945997983, + "learning_rate": 2.6755294764829926e-05, + "loss": 0.9514, + "mean_token_accuracy": 0.7109884262084961, + "num_tokens": 232145307.0, + "step": 94480 + }, + { + "epoch": 0.8663243788392775, + "learning_rate": 2.673695791693408e-05, + "loss": 0.9716, + "mean_token_accuracy": 0.7080773949623108, + "num_tokens": 232174173.0, + "step": 94490 + }, + { + "epoch": 0.8664160630787567, + "learning_rate": 2.6718621069038236e-05, + "loss": 0.9585, + "mean_token_accuracy": 0.7067557334899902, + "num_tokens": 232202027.0, + "step": 94500 + }, + { + "epoch": 0.866507747318236, + "learning_rate": 2.6700284221142385e-05, + "loss": 0.9805, + "mean_token_accuracy": 0.7113572180271148, + "num_tokens": 232232278.0, + "step": 94510 + }, + { + "epoch": 0.8665994315577152, + "learning_rate": 2.668194737324654e-05, + "loss": 0.9828, + "mean_token_accuracy": 0.7049754381179809, + "num_tokens": 232261493.0, + "step": 94520 + }, + { + "epoch": 0.8666911157971945, + "learning_rate": 2.6663610525350695e-05, + "loss": 0.9949, + "mean_token_accuracy": 0.7011536180973053, + "num_tokens": 232290512.0, + "step": 94530 + }, + { + "epoch": 0.8667828000366737, + "learning_rate": 2.6645273677454847e-05, + "loss": 1.0086, + "mean_token_accuracy": 0.697703379392624, + "num_tokens": 232320930.0, + "step": 94540 + }, + { + "epoch": 0.8668744842761529, + "learning_rate": 2.6626936829559002e-05, + "loss": 0.9921, + "mean_token_accuracy": 0.7040180504322052, + "num_tokens": 232350121.0, + "step": 94550 + }, + { + "epoch": 0.8669661685156321, + "learning_rate": 2.660859998166315e-05, + "loss": 0.9816, + "mean_token_accuracy": 0.7010047674179077, + "num_tokens": 232378606.0, + "step": 94560 + }, + { + "epoch": 0.8670578527551114, + "learning_rate": 2.6590263133767306e-05, + "loss": 1.0194, + "mean_token_accuracy": 0.6984214723110199, + "num_tokens": 232408145.0, + "step": 94570 + }, + { + "epoch": 0.8671495369945906, + "learning_rate": 2.657192628587146e-05, + "loss": 0.9622, + "mean_token_accuracy": 0.7074166297912597, + "num_tokens": 232437784.0, + "step": 94580 + }, + { + "epoch": 0.8672412212340699, + "learning_rate": 2.6553589437975613e-05, + "loss": 0.9427, + "mean_token_accuracy": 0.7127412855625153, + "num_tokens": 232467373.0, + "step": 94590 + }, + { + "epoch": 0.8673329054735491, + "learning_rate": 2.653525259007977e-05, + "loss": 1.0081, + "mean_token_accuracy": 0.6999133467674256, + "num_tokens": 232496390.0, + "step": 94600 + }, + { + "epoch": 0.8674245897130284, + "learning_rate": 2.6516915742183917e-05, + "loss": 0.998, + "mean_token_accuracy": 0.7039475798606872, + "num_tokens": 232525541.0, + "step": 94610 + }, + { + "epoch": 0.8675162739525075, + "learning_rate": 2.6498578894288072e-05, + "loss": 0.9571, + "mean_token_accuracy": 0.7070056378841401, + "num_tokens": 232554456.0, + "step": 94620 + }, + { + "epoch": 0.8676079581919868, + "learning_rate": 2.6480242046392228e-05, + "loss": 0.9749, + "mean_token_accuracy": 0.7079532027244568, + "num_tokens": 232583904.0, + "step": 94630 + }, + { + "epoch": 0.867699642431466, + "learning_rate": 2.646190519849638e-05, + "loss": 0.956, + "mean_token_accuracy": 0.7131348252296448, + "num_tokens": 232613638.0, + "step": 94640 + }, + { + "epoch": 0.8677913266709453, + "learning_rate": 2.6443568350600535e-05, + "loss": 0.9597, + "mean_token_accuracy": 0.7060459673404693, + "num_tokens": 232642199.0, + "step": 94650 + }, + { + "epoch": 0.8678830109104245, + "learning_rate": 2.6425231502704683e-05, + "loss": 0.9639, + "mean_token_accuracy": 0.7111473381519318, + "num_tokens": 232670925.0, + "step": 94660 + }, + { + "epoch": 0.8679746951499038, + "learning_rate": 2.640689465480884e-05, + "loss": 0.9892, + "mean_token_accuracy": 0.7017959654331207, + "num_tokens": 232699820.0, + "step": 94670 + }, + { + "epoch": 0.8680663793893829, + "learning_rate": 2.6388557806912994e-05, + "loss": 0.9897, + "mean_token_accuracy": 0.7052757978439331, + "num_tokens": 232728175.0, + "step": 94680 + }, + { + "epoch": 0.8681580636288622, + "learning_rate": 2.6370220959017145e-05, + "loss": 0.9394, + "mean_token_accuracy": 0.7146795988082886, + "num_tokens": 232756588.0, + "step": 94690 + }, + { + "epoch": 0.8682497478683414, + "learning_rate": 2.63518841111213e-05, + "loss": 0.9949, + "mean_token_accuracy": 0.6988874673843384, + "num_tokens": 232785942.0, + "step": 94700 + }, + { + "epoch": 0.8683414321078207, + "learning_rate": 2.6333547263225456e-05, + "loss": 0.9749, + "mean_token_accuracy": 0.7053543865680695, + "num_tokens": 232814163.0, + "step": 94710 + }, + { + "epoch": 0.8684331163472999, + "learning_rate": 2.6315210415329604e-05, + "loss": 1.0181, + "mean_token_accuracy": 0.6953714549541473, + "num_tokens": 232843536.0, + "step": 94720 + }, + { + "epoch": 0.8685248005867792, + "learning_rate": 2.629687356743376e-05, + "loss": 0.9833, + "mean_token_accuracy": 0.7034175992012024, + "num_tokens": 232872725.0, + "step": 94730 + }, + { + "epoch": 0.8686164848262584, + "learning_rate": 2.627853671953791e-05, + "loss": 0.9623, + "mean_token_accuracy": 0.7084377586841584, + "num_tokens": 232899619.0, + "step": 94740 + }, + { + "epoch": 0.8687081690657376, + "learning_rate": 2.6260199871642067e-05, + "loss": 0.9837, + "mean_token_accuracy": 0.7027204811573029, + "num_tokens": 232929152.0, + "step": 94750 + }, + { + "epoch": 0.8687998533052168, + "learning_rate": 2.6241863023746222e-05, + "loss": 1.0264, + "mean_token_accuracy": 0.6943724989891052, + "num_tokens": 232958774.0, + "step": 94760 + }, + { + "epoch": 0.8688915375446961, + "learning_rate": 2.622352617585037e-05, + "loss": 0.9549, + "mean_token_accuracy": 0.7107896268367767, + "num_tokens": 232987364.0, + "step": 94770 + }, + { + "epoch": 0.8689832217841753, + "learning_rate": 2.6205189327954526e-05, + "loss": 0.9701, + "mean_token_accuracy": 0.7117876529693603, + "num_tokens": 233015145.0, + "step": 94780 + }, + { + "epoch": 0.8690749060236546, + "learning_rate": 2.6186852480058678e-05, + "loss": 0.9652, + "mean_token_accuracy": 0.7065112113952636, + "num_tokens": 233043891.0, + "step": 94790 + }, + { + "epoch": 0.8691665902631338, + "learning_rate": 2.6168515632162833e-05, + "loss": 0.9754, + "mean_token_accuracy": 0.7085714340209961, + "num_tokens": 233071931.0, + "step": 94800 + }, + { + "epoch": 0.869258274502613, + "learning_rate": 2.6150178784266988e-05, + "loss": 0.996, + "mean_token_accuracy": 0.702934467792511, + "num_tokens": 233101663.0, + "step": 94810 + }, + { + "epoch": 0.8693499587420922, + "learning_rate": 2.6131841936371137e-05, + "loss": 0.9667, + "mean_token_accuracy": 0.704881340265274, + "num_tokens": 233130016.0, + "step": 94820 + }, + { + "epoch": 0.8694416429815714, + "learning_rate": 2.6113505088475292e-05, + "loss": 0.99, + "mean_token_accuracy": 0.7008226096630097, + "num_tokens": 233158300.0, + "step": 94830 + }, + { + "epoch": 0.8695333272210507, + "learning_rate": 2.6095168240579444e-05, + "loss": 1.0013, + "mean_token_accuracy": 0.701530122756958, + "num_tokens": 233188440.0, + "step": 94840 + }, + { + "epoch": 0.86962501146053, + "learning_rate": 2.60768313926836e-05, + "loss": 0.9663, + "mean_token_accuracy": 0.7130723536014557, + "num_tokens": 233218179.0, + "step": 94850 + }, + { + "epoch": 0.8697166957000092, + "learning_rate": 2.6058494544787754e-05, + "loss": 1.0023, + "mean_token_accuracy": 0.6981267809867859, + "num_tokens": 233246321.0, + "step": 94860 + }, + { + "epoch": 0.8698083799394885, + "learning_rate": 2.6040157696891903e-05, + "loss": 0.9526, + "mean_token_accuracy": 0.7105185151100158, + "num_tokens": 233275232.0, + "step": 94870 + }, + { + "epoch": 0.8699000641789676, + "learning_rate": 2.6021820848996058e-05, + "loss": 0.9756, + "mean_token_accuracy": 0.7113110899925232, + "num_tokens": 233302680.0, + "step": 94880 + }, + { + "epoch": 0.8699917484184468, + "learning_rate": 2.6003484001100213e-05, + "loss": 0.9531, + "mean_token_accuracy": 0.7159253478050231, + "num_tokens": 233331749.0, + "step": 94890 + }, + { + "epoch": 0.8700834326579261, + "learning_rate": 2.5985147153204365e-05, + "loss": 0.9449, + "mean_token_accuracy": 0.7144491136074066, + "num_tokens": 233360578.0, + "step": 94900 + }, + { + "epoch": 0.8701751168974053, + "learning_rate": 2.596681030530852e-05, + "loss": 0.9573, + "mean_token_accuracy": 0.7086441040039062, + "num_tokens": 233389492.0, + "step": 94910 + }, + { + "epoch": 0.8702668011368846, + "learning_rate": 2.594847345741267e-05, + "loss": 0.9643, + "mean_token_accuracy": 0.7050327181816101, + "num_tokens": 233417646.0, + "step": 94920 + }, + { + "epoch": 0.8703584853763638, + "learning_rate": 2.5930136609516824e-05, + "loss": 0.9746, + "mean_token_accuracy": 0.7074222266674042, + "num_tokens": 233445439.0, + "step": 94930 + }, + { + "epoch": 0.870450169615843, + "learning_rate": 2.591179976162098e-05, + "loss": 0.9242, + "mean_token_accuracy": 0.7211675465106964, + "num_tokens": 233473966.0, + "step": 94940 + }, + { + "epoch": 0.8705418538553222, + "learning_rate": 2.589346291372513e-05, + "loss": 0.9854, + "mean_token_accuracy": 0.7037066578865051, + "num_tokens": 233502820.0, + "step": 94950 + }, + { + "epoch": 0.8706335380948015, + "learning_rate": 2.5875126065829287e-05, + "loss": 0.9972, + "mean_token_accuracy": 0.7012357950210572, + "num_tokens": 233530257.0, + "step": 94960 + }, + { + "epoch": 0.8707252223342807, + "learning_rate": 2.5856789217933435e-05, + "loss": 0.9663, + "mean_token_accuracy": 0.7035387933254242, + "num_tokens": 233560472.0, + "step": 94970 + }, + { + "epoch": 0.87081690657376, + "learning_rate": 2.583845237003759e-05, + "loss": 0.9637, + "mean_token_accuracy": 0.708971232175827, + "num_tokens": 233588403.0, + "step": 94980 + }, + { + "epoch": 0.8709085908132392, + "learning_rate": 2.5820115522141746e-05, + "loss": 1.0025, + "mean_token_accuracy": 0.7040158629417419, + "num_tokens": 233615823.0, + "step": 94990 + }, + { + "epoch": 0.8710002750527185, + "learning_rate": 2.5801778674245897e-05, + "loss": 0.9713, + "mean_token_accuracy": 0.7070195496082305, + "num_tokens": 233645321.0, + "step": 95000 + }, + { + "epoch": 0.8710919592921976, + "learning_rate": 2.5783441826350053e-05, + "loss": 0.9863, + "mean_token_accuracy": 0.7015394985675811, + "num_tokens": 233675199.0, + "step": 95010 + }, + { + "epoch": 0.8711836435316769, + "learning_rate": 2.5765104978454208e-05, + "loss": 0.9805, + "mean_token_accuracy": 0.7036999762058258, + "num_tokens": 233703256.0, + "step": 95020 + }, + { + "epoch": 0.8712753277711561, + "learning_rate": 2.5746768130558356e-05, + "loss": 0.9551, + "mean_token_accuracy": 0.7102802157402038, + "num_tokens": 233732170.0, + "step": 95030 + }, + { + "epoch": 0.8713670120106354, + "learning_rate": 2.572843128266251e-05, + "loss": 0.9677, + "mean_token_accuracy": 0.7078596889972687, + "num_tokens": 233760230.0, + "step": 95040 + }, + { + "epoch": 0.8714586962501146, + "learning_rate": 2.5710094434766664e-05, + "loss": 0.9759, + "mean_token_accuracy": 0.7082966566085815, + "num_tokens": 233789705.0, + "step": 95050 + }, + { + "epoch": 0.8715503804895939, + "learning_rate": 2.569175758687082e-05, + "loss": 0.9796, + "mean_token_accuracy": 0.703370201587677, + "num_tokens": 233817490.0, + "step": 95060 + }, + { + "epoch": 0.871642064729073, + "learning_rate": 2.5673420738974974e-05, + "loss": 0.9765, + "mean_token_accuracy": 0.7046668887138366, + "num_tokens": 233845745.0, + "step": 95070 + }, + { + "epoch": 0.8717337489685523, + "learning_rate": 2.5655083891079123e-05, + "loss": 0.9799, + "mean_token_accuracy": 0.7063077211380004, + "num_tokens": 233874955.0, + "step": 95080 + }, + { + "epoch": 0.8718254332080315, + "learning_rate": 2.5636747043183278e-05, + "loss": 0.9647, + "mean_token_accuracy": 0.7077544212341309, + "num_tokens": 233902908.0, + "step": 95090 + }, + { + "epoch": 0.8719171174475108, + "learning_rate": 2.561841019528743e-05, + "loss": 0.9876, + "mean_token_accuracy": 0.6998224079608917, + "num_tokens": 233931375.0, + "step": 95100 + }, + { + "epoch": 0.87200880168699, + "learning_rate": 2.5600073347391585e-05, + "loss": 0.9622, + "mean_token_accuracy": 0.7097045123577118, + "num_tokens": 233961956.0, + "step": 95110 + }, + { + "epoch": 0.8721004859264693, + "learning_rate": 2.558173649949574e-05, + "loss": 0.9701, + "mean_token_accuracy": 0.7076535224914551, + "num_tokens": 233990360.0, + "step": 95120 + }, + { + "epoch": 0.8721921701659485, + "learning_rate": 2.556339965159989e-05, + "loss": 0.9746, + "mean_token_accuracy": 0.7034613966941834, + "num_tokens": 234020465.0, + "step": 95130 + }, + { + "epoch": 0.8722838544054277, + "learning_rate": 2.5545062803704044e-05, + "loss": 0.9643, + "mean_token_accuracy": 0.708831250667572, + "num_tokens": 234048471.0, + "step": 95140 + }, + { + "epoch": 0.8723755386449069, + "learning_rate": 2.5526725955808196e-05, + "loss": 1.0, + "mean_token_accuracy": 0.7020787358283996, + "num_tokens": 234077948.0, + "step": 95150 + }, + { + "epoch": 0.8724672228843862, + "learning_rate": 2.550838910791235e-05, + "loss": 0.9822, + "mean_token_accuracy": 0.7070713996887207, + "num_tokens": 234106271.0, + "step": 95160 + }, + { + "epoch": 0.8725589071238654, + "learning_rate": 2.5490052260016506e-05, + "loss": 0.9846, + "mean_token_accuracy": 0.7102813124656677, + "num_tokens": 234134655.0, + "step": 95170 + }, + { + "epoch": 0.8726505913633447, + "learning_rate": 2.5471715412120655e-05, + "loss": 0.9719, + "mean_token_accuracy": 0.7100964784622192, + "num_tokens": 234162795.0, + "step": 95180 + }, + { + "epoch": 0.8727422756028239, + "learning_rate": 2.545337856422481e-05, + "loss": 0.9509, + "mean_token_accuracy": 0.7117873907089234, + "num_tokens": 234192416.0, + "step": 95190 + }, + { + "epoch": 0.872833959842303, + "learning_rate": 2.5435041716328965e-05, + "loss": 0.972, + "mean_token_accuracy": 0.7072008550167084, + "num_tokens": 234221732.0, + "step": 95200 + }, + { + "epoch": 0.8729256440817823, + "learning_rate": 2.5416704868433117e-05, + "loss": 0.9356, + "mean_token_accuracy": 0.7139463067054749, + "num_tokens": 234250512.0, + "step": 95210 + }, + { + "epoch": 0.8730173283212616, + "learning_rate": 2.5398368020537272e-05, + "loss": 0.9465, + "mean_token_accuracy": 0.7087880313396454, + "num_tokens": 234278950.0, + "step": 95220 + }, + { + "epoch": 0.8731090125607408, + "learning_rate": 2.538003117264142e-05, + "loss": 0.9947, + "mean_token_accuracy": 0.6958837747573853, + "num_tokens": 234308344.0, + "step": 95230 + }, + { + "epoch": 0.87320069680022, + "learning_rate": 2.5361694324745576e-05, + "loss": 0.9845, + "mean_token_accuracy": 0.7043018460273742, + "num_tokens": 234337370.0, + "step": 95240 + }, + { + "epoch": 0.8732923810396993, + "learning_rate": 2.534335747684973e-05, + "loss": 0.9475, + "mean_token_accuracy": 0.7157825469970703, + "num_tokens": 234367341.0, + "step": 95250 + }, + { + "epoch": 0.8733840652791786, + "learning_rate": 2.5325020628953883e-05, + "loss": 0.9805, + "mean_token_accuracy": 0.7008367896080017, + "num_tokens": 234396779.0, + "step": 95260 + }, + { + "epoch": 0.8734757495186577, + "learning_rate": 2.530668378105804e-05, + "loss": 0.9728, + "mean_token_accuracy": 0.7053045749664306, + "num_tokens": 234425469.0, + "step": 95270 + }, + { + "epoch": 0.873567433758137, + "learning_rate": 2.5288346933162187e-05, + "loss": 0.9709, + "mean_token_accuracy": 0.7075625956058502, + "num_tokens": 234453451.0, + "step": 95280 + }, + { + "epoch": 0.8736591179976162, + "learning_rate": 2.5270010085266342e-05, + "loss": 0.9498, + "mean_token_accuracy": 0.711888062953949, + "num_tokens": 234480748.0, + "step": 95290 + }, + { + "epoch": 0.8737508022370954, + "learning_rate": 2.5251673237370498e-05, + "loss": 0.9419, + "mean_token_accuracy": 0.7127594470977783, + "num_tokens": 234509115.0, + "step": 95300 + }, + { + "epoch": 0.8738424864765747, + "learning_rate": 2.523333638947465e-05, + "loss": 0.9791, + "mean_token_accuracy": 0.7048508524894714, + "num_tokens": 234537613.0, + "step": 95310 + }, + { + "epoch": 0.873934170716054, + "learning_rate": 2.5214999541578805e-05, + "loss": 0.9787, + "mean_token_accuracy": 0.7064248204231263, + "num_tokens": 234566964.0, + "step": 95320 + }, + { + "epoch": 0.8740258549555332, + "learning_rate": 2.519666269368296e-05, + "loss": 0.9684, + "mean_token_accuracy": 0.7089863121509552, + "num_tokens": 234595953.0, + "step": 95330 + }, + { + "epoch": 0.8741175391950123, + "learning_rate": 2.517832584578711e-05, + "loss": 0.9586, + "mean_token_accuracy": 0.7119853258132934, + "num_tokens": 234624611.0, + "step": 95340 + }, + { + "epoch": 0.8742092234344916, + "learning_rate": 2.5159988997891264e-05, + "loss": 0.9696, + "mean_token_accuracy": 0.7046167969703674, + "num_tokens": 234652585.0, + "step": 95350 + }, + { + "epoch": 0.8743009076739708, + "learning_rate": 2.5141652149995415e-05, + "loss": 0.9918, + "mean_token_accuracy": 0.7043960213661193, + "num_tokens": 234682260.0, + "step": 95360 + }, + { + "epoch": 0.8743925919134501, + "learning_rate": 2.512331530209957e-05, + "loss": 1.0129, + "mean_token_accuracy": 0.6981764316558838, + "num_tokens": 234711641.0, + "step": 95370 + }, + { + "epoch": 0.8744842761529293, + "learning_rate": 2.5104978454203726e-05, + "loss": 0.9632, + "mean_token_accuracy": 0.7097373843193054, + "num_tokens": 234740476.0, + "step": 95380 + }, + { + "epoch": 0.8745759603924086, + "learning_rate": 2.5086641606307874e-05, + "loss": 0.955, + "mean_token_accuracy": 0.7070928752422333, + "num_tokens": 234768921.0, + "step": 95390 + }, + { + "epoch": 0.8746676446318877, + "learning_rate": 2.506830475841203e-05, + "loss": 0.9468, + "mean_token_accuracy": 0.7109356701374054, + "num_tokens": 234796761.0, + "step": 95400 + }, + { + "epoch": 0.874759328871367, + "learning_rate": 2.504996791051618e-05, + "loss": 0.9568, + "mean_token_accuracy": 0.7114959239959717, + "num_tokens": 234825311.0, + "step": 95410 + }, + { + "epoch": 0.8748510131108462, + "learning_rate": 2.5031631062620337e-05, + "loss": 0.9503, + "mean_token_accuracy": 0.7101741313934327, + "num_tokens": 234854479.0, + "step": 95420 + }, + { + "epoch": 0.8749426973503255, + "learning_rate": 2.5013294214724492e-05, + "loss": 1.017, + "mean_token_accuracy": 0.6984456002712249, + "num_tokens": 234884382.0, + "step": 95430 + }, + { + "epoch": 0.8750343815898047, + "learning_rate": 2.4994957366828644e-05, + "loss": 0.9699, + "mean_token_accuracy": 0.7042559802532196, + "num_tokens": 234913271.0, + "step": 95440 + }, + { + "epoch": 0.875126065829284, + "learning_rate": 2.4976620518932796e-05, + "loss": 0.99, + "mean_token_accuracy": 0.7045483469963074, + "num_tokens": 234940914.0, + "step": 95450 + }, + { + "epoch": 0.8752177500687632, + "learning_rate": 2.495828367103695e-05, + "loss": 0.9818, + "mean_token_accuracy": 0.7026433408260345, + "num_tokens": 234968617.0, + "step": 95460 + }, + { + "epoch": 0.8753094343082424, + "learning_rate": 2.4939946823141103e-05, + "loss": 0.9761, + "mean_token_accuracy": 0.7051691889762879, + "num_tokens": 234997132.0, + "step": 95470 + }, + { + "epoch": 0.8754011185477216, + "learning_rate": 2.4921609975245255e-05, + "loss": 1.0013, + "mean_token_accuracy": 0.7004251718521118, + "num_tokens": 235025374.0, + "step": 95480 + }, + { + "epoch": 0.8754928027872009, + "learning_rate": 2.490327312734941e-05, + "loss": 0.9646, + "mean_token_accuracy": 0.7087277770042419, + "num_tokens": 235054127.0, + "step": 95490 + }, + { + "epoch": 0.8755844870266801, + "learning_rate": 2.4884936279453562e-05, + "loss": 0.9766, + "mean_token_accuracy": 0.7062869131565094, + "num_tokens": 235082647.0, + "step": 95500 + }, + { + "epoch": 0.8756761712661594, + "learning_rate": 2.4866599431557717e-05, + "loss": 0.9695, + "mean_token_accuracy": 0.7079085886478425, + "num_tokens": 235110432.0, + "step": 95510 + }, + { + "epoch": 0.8757678555056386, + "learning_rate": 2.484826258366187e-05, + "loss": 0.9696, + "mean_token_accuracy": 0.7054381608963013, + "num_tokens": 235138219.0, + "step": 95520 + }, + { + "epoch": 0.8758595397451178, + "learning_rate": 2.4829925735766024e-05, + "loss": 0.9694, + "mean_token_accuracy": 0.7025360882282257, + "num_tokens": 235166725.0, + "step": 95530 + }, + { + "epoch": 0.875951223984597, + "learning_rate": 2.4811588887870176e-05, + "loss": 0.9833, + "mean_token_accuracy": 0.7031918048858643, + "num_tokens": 235195793.0, + "step": 95540 + }, + { + "epoch": 0.8760429082240763, + "learning_rate": 2.4793252039974328e-05, + "loss": 0.9581, + "mean_token_accuracy": 0.7089531123638153, + "num_tokens": 235225290.0, + "step": 95550 + }, + { + "epoch": 0.8761345924635555, + "learning_rate": 2.4774915192078483e-05, + "loss": 0.9587, + "mean_token_accuracy": 0.7031606495380401, + "num_tokens": 235253050.0, + "step": 95560 + }, + { + "epoch": 0.8762262767030348, + "learning_rate": 2.4756578344182635e-05, + "loss": 0.9654, + "mean_token_accuracy": 0.7063882887363434, + "num_tokens": 235281109.0, + "step": 95570 + }, + { + "epoch": 0.876317960942514, + "learning_rate": 2.473824149628679e-05, + "loss": 0.9746, + "mean_token_accuracy": 0.7035144686698913, + "num_tokens": 235309797.0, + "step": 95580 + }, + { + "epoch": 0.8764096451819933, + "learning_rate": 2.4719904648390942e-05, + "loss": 0.9657, + "mean_token_accuracy": 0.7078938066959382, + "num_tokens": 235338386.0, + "step": 95590 + }, + { + "epoch": 0.8765013294214724, + "learning_rate": 2.4701567800495094e-05, + "loss": 0.9946, + "mean_token_accuracy": 0.6995946943759919, + "num_tokens": 235367347.0, + "step": 95600 + }, + { + "epoch": 0.8765930136609517, + "learning_rate": 2.468323095259925e-05, + "loss": 0.9675, + "mean_token_accuracy": 0.7101439595222473, + "num_tokens": 235396414.0, + "step": 95610 + }, + { + "epoch": 0.8766846979004309, + "learning_rate": 2.4664894104703405e-05, + "loss": 0.9913, + "mean_token_accuracy": 0.6996130347251892, + "num_tokens": 235425276.0, + "step": 95620 + }, + { + "epoch": 0.8767763821399102, + "learning_rate": 2.4646557256807557e-05, + "loss": 0.9742, + "mean_token_accuracy": 0.7068098068237305, + "num_tokens": 235452571.0, + "step": 95630 + }, + { + "epoch": 0.8768680663793894, + "learning_rate": 2.462822040891171e-05, + "loss": 1.0056, + "mean_token_accuracy": 0.700124728679657, + "num_tokens": 235482425.0, + "step": 95640 + }, + { + "epoch": 0.8769597506188687, + "learning_rate": 2.460988356101586e-05, + "loss": 0.9326, + "mean_token_accuracy": 0.7112212598323822, + "num_tokens": 235510113.0, + "step": 95650 + }, + { + "epoch": 0.8770514348583478, + "learning_rate": 2.4591546713120016e-05, + "loss": 0.9737, + "mean_token_accuracy": 0.7041312277317047, + "num_tokens": 235538601.0, + "step": 95660 + }, + { + "epoch": 0.877143119097827, + "learning_rate": 2.457320986522417e-05, + "loss": 0.9726, + "mean_token_accuracy": 0.7038525938987732, + "num_tokens": 235567940.0, + "step": 95670 + }, + { + "epoch": 0.8772348033373063, + "learning_rate": 2.4554873017328323e-05, + "loss": 0.9739, + "mean_token_accuracy": 0.7062692642211914, + "num_tokens": 235597253.0, + "step": 95680 + }, + { + "epoch": 0.8773264875767856, + "learning_rate": 2.4536536169432475e-05, + "loss": 0.9766, + "mean_token_accuracy": 0.7078110098838806, + "num_tokens": 235625708.0, + "step": 95690 + }, + { + "epoch": 0.8774181718162648, + "learning_rate": 2.4518199321536626e-05, + "loss": 0.9599, + "mean_token_accuracy": 0.7113600492477417, + "num_tokens": 235653706.0, + "step": 95700 + }, + { + "epoch": 0.877509856055744, + "learning_rate": 2.449986247364078e-05, + "loss": 0.964, + "mean_token_accuracy": 0.7109102964401245, + "num_tokens": 235681221.0, + "step": 95710 + }, + { + "epoch": 0.8776015402952233, + "learning_rate": 2.4481525625744937e-05, + "loss": 0.9534, + "mean_token_accuracy": 0.7113423347473145, + "num_tokens": 235708927.0, + "step": 95720 + }, + { + "epoch": 0.8776932245347024, + "learning_rate": 2.446318877784909e-05, + "loss": 0.9683, + "mean_token_accuracy": 0.7058891594409943, + "num_tokens": 235737474.0, + "step": 95730 + }, + { + "epoch": 0.8777849087741817, + "learning_rate": 2.444485192995324e-05, + "loss": 0.9834, + "mean_token_accuracy": 0.7096074402332306, + "num_tokens": 235765542.0, + "step": 95740 + }, + { + "epoch": 0.8778765930136609, + "learning_rate": 2.4426515082057396e-05, + "loss": 0.9643, + "mean_token_accuracy": 0.7085775971412659, + "num_tokens": 235794028.0, + "step": 95750 + }, + { + "epoch": 0.8779682772531402, + "learning_rate": 2.4408178234161548e-05, + "loss": 0.9723, + "mean_token_accuracy": 0.7010929107666015, + "num_tokens": 235822112.0, + "step": 95760 + }, + { + "epoch": 0.8780599614926194, + "learning_rate": 2.4389841386265703e-05, + "loss": 0.9543, + "mean_token_accuracy": 0.7064978361129761, + "num_tokens": 235850543.0, + "step": 95770 + }, + { + "epoch": 0.8781516457320987, + "learning_rate": 2.4371504538369855e-05, + "loss": 0.9773, + "mean_token_accuracy": 0.7082438051700592, + "num_tokens": 235879312.0, + "step": 95780 + }, + { + "epoch": 0.8782433299715778, + "learning_rate": 2.4353167690474007e-05, + "loss": 0.9623, + "mean_token_accuracy": 0.710709398984909, + "num_tokens": 235908264.0, + "step": 95790 + }, + { + "epoch": 0.8783350142110571, + "learning_rate": 2.4334830842578162e-05, + "loss": 0.9693, + "mean_token_accuracy": 0.7027275800704956, + "num_tokens": 235937186.0, + "step": 95800 + }, + { + "epoch": 0.8784266984505363, + "learning_rate": 2.4316493994682317e-05, + "loss": 1.0035, + "mean_token_accuracy": 0.6995549619197845, + "num_tokens": 235966037.0, + "step": 95810 + }, + { + "epoch": 0.8785183826900156, + "learning_rate": 2.429815714678647e-05, + "loss": 0.9826, + "mean_token_accuracy": 0.7057016968727112, + "num_tokens": 235993270.0, + "step": 95820 + }, + { + "epoch": 0.8786100669294948, + "learning_rate": 2.427982029889062e-05, + "loss": 0.9874, + "mean_token_accuracy": 0.7001482546329498, + "num_tokens": 236022678.0, + "step": 95830 + }, + { + "epoch": 0.8787017511689741, + "learning_rate": 2.4261483450994776e-05, + "loss": 0.9667, + "mean_token_accuracy": 0.7085700333118439, + "num_tokens": 236050301.0, + "step": 95840 + }, + { + "epoch": 0.8787934354084533, + "learning_rate": 2.4243146603098928e-05, + "loss": 0.9667, + "mean_token_accuracy": 0.7068552613258362, + "num_tokens": 236077861.0, + "step": 95850 + }, + { + "epoch": 0.8788851196479325, + "learning_rate": 2.4224809755203083e-05, + "loss": 0.9695, + "mean_token_accuracy": 0.7068959414958954, + "num_tokens": 236105802.0, + "step": 95860 + }, + { + "epoch": 0.8789768038874117, + "learning_rate": 2.4206472907307235e-05, + "loss": 0.9593, + "mean_token_accuracy": 0.7121960997581482, + "num_tokens": 236134564.0, + "step": 95870 + }, + { + "epoch": 0.879068488126891, + "learning_rate": 2.4188136059411387e-05, + "loss": 0.9654, + "mean_token_accuracy": 0.7062169075012207, + "num_tokens": 236162176.0, + "step": 95880 + }, + { + "epoch": 0.8791601723663702, + "learning_rate": 2.4169799211515542e-05, + "loss": 0.96, + "mean_token_accuracy": 0.7049622416496277, + "num_tokens": 236191137.0, + "step": 95890 + }, + { + "epoch": 0.8792518566058495, + "learning_rate": 2.4151462363619694e-05, + "loss": 0.9617, + "mean_token_accuracy": 0.7068059146404266, + "num_tokens": 236220024.0, + "step": 95900 + }, + { + "epoch": 0.8793435408453287, + "learning_rate": 2.413312551572385e-05, + "loss": 0.9872, + "mean_token_accuracy": 0.6995436012744903, + "num_tokens": 236248522.0, + "step": 95910 + }, + { + "epoch": 0.8794352250848079, + "learning_rate": 2.4114788667828e-05, + "loss": 0.9547, + "mean_token_accuracy": 0.7080778479576111, + "num_tokens": 236277254.0, + "step": 95920 + }, + { + "epoch": 0.8795269093242871, + "learning_rate": 2.4096451819932157e-05, + "loss": 0.9917, + "mean_token_accuracy": 0.6987809240818024, + "num_tokens": 236305947.0, + "step": 95930 + }, + { + "epoch": 0.8796185935637664, + "learning_rate": 2.407811497203631e-05, + "loss": 0.9543, + "mean_token_accuracy": 0.7094142258167266, + "num_tokens": 236334529.0, + "step": 95940 + }, + { + "epoch": 0.8797102778032456, + "learning_rate": 2.405977812414046e-05, + "loss": 0.9831, + "mean_token_accuracy": 0.6997954726219178, + "num_tokens": 236362266.0, + "step": 95950 + }, + { + "epoch": 0.8798019620427249, + "learning_rate": 2.4041441276244616e-05, + "loss": 1.0043, + "mean_token_accuracy": 0.7003909707069397, + "num_tokens": 236390276.0, + "step": 95960 + }, + { + "epoch": 0.8798936462822041, + "learning_rate": 2.4023104428348767e-05, + "loss": 0.9631, + "mean_token_accuracy": 0.7065606951713562, + "num_tokens": 236418401.0, + "step": 95970 + }, + { + "epoch": 0.8799853305216834, + "learning_rate": 2.4004767580452923e-05, + "loss": 0.9725, + "mean_token_accuracy": 0.7057132840156555, + "num_tokens": 236446703.0, + "step": 95980 + }, + { + "epoch": 0.8800770147611625, + "learning_rate": 2.3986430732557075e-05, + "loss": 0.9855, + "mean_token_accuracy": 0.706520426273346, + "num_tokens": 236475330.0, + "step": 95990 + }, + { + "epoch": 0.8801686990006418, + "learning_rate": 2.3968093884661226e-05, + "loss": 0.9699, + "mean_token_accuracy": 0.7042117118835449, + "num_tokens": 236504253.0, + "step": 96000 + }, + { + "epoch": 0.880260383240121, + "learning_rate": 2.3949757036765382e-05, + "loss": 0.9846, + "mean_token_accuracy": 0.7061336159706115, + "num_tokens": 236532302.0, + "step": 96010 + }, + { + "epoch": 0.8803520674796003, + "learning_rate": 2.3931420188869537e-05, + "loss": 0.9829, + "mean_token_accuracy": 0.7032469272613525, + "num_tokens": 236561433.0, + "step": 96020 + }, + { + "epoch": 0.8804437517190795, + "learning_rate": 2.391308334097369e-05, + "loss": 0.9989, + "mean_token_accuracy": 0.6975636303424835, + "num_tokens": 236589528.0, + "step": 96030 + }, + { + "epoch": 0.8805354359585588, + "learning_rate": 2.389474649307784e-05, + "loss": 0.9552, + "mean_token_accuracy": 0.712497740983963, + "num_tokens": 236617946.0, + "step": 96040 + }, + { + "epoch": 0.8806271201980379, + "learning_rate": 2.3876409645181993e-05, + "loss": 0.9513, + "mean_token_accuracy": 0.7090511202812195, + "num_tokens": 236647618.0, + "step": 96050 + }, + { + "epoch": 0.8807188044375172, + "learning_rate": 2.3858072797286148e-05, + "loss": 0.9822, + "mean_token_accuracy": 0.7052377939224244, + "num_tokens": 236675720.0, + "step": 96060 + }, + { + "epoch": 0.8808104886769964, + "learning_rate": 2.3839735949390303e-05, + "loss": 0.9717, + "mean_token_accuracy": 0.7043699324131012, + "num_tokens": 236704286.0, + "step": 96070 + }, + { + "epoch": 0.8809021729164757, + "learning_rate": 2.3821399101494455e-05, + "loss": 0.9718, + "mean_token_accuracy": 0.706047248840332, + "num_tokens": 236732401.0, + "step": 96080 + }, + { + "epoch": 0.8809938571559549, + "learning_rate": 2.3803062253598607e-05, + "loss": 0.9767, + "mean_token_accuracy": 0.7095676183700561, + "num_tokens": 236760944.0, + "step": 96090 + }, + { + "epoch": 0.8810855413954342, + "learning_rate": 2.378472540570276e-05, + "loss": 0.9803, + "mean_token_accuracy": 0.7032656311988831, + "num_tokens": 236789216.0, + "step": 96100 + }, + { + "epoch": 0.8811772256349134, + "learning_rate": 2.3766388557806914e-05, + "loss": 0.9917, + "mean_token_accuracy": 0.7007404029369354, + "num_tokens": 236818347.0, + "step": 96110 + }, + { + "epoch": 0.8812689098743925, + "learning_rate": 2.374805170991107e-05, + "loss": 0.9521, + "mean_token_accuracy": 0.7090234696865082, + "num_tokens": 236846810.0, + "step": 96120 + }, + { + "epoch": 0.8813605941138718, + "learning_rate": 2.372971486201522e-05, + "loss": 0.962, + "mean_token_accuracy": 0.7073679208755493, + "num_tokens": 236875071.0, + "step": 96130 + }, + { + "epoch": 0.881452278353351, + "learning_rate": 2.3711378014119373e-05, + "loss": 0.9451, + "mean_token_accuracy": 0.7103154122829437, + "num_tokens": 236903111.0, + "step": 96140 + }, + { + "epoch": 0.8815439625928303, + "learning_rate": 2.3693041166223528e-05, + "loss": 0.9731, + "mean_token_accuracy": 0.7064365804195404, + "num_tokens": 236931871.0, + "step": 96150 + }, + { + "epoch": 0.8816356468323095, + "learning_rate": 2.367470431832768e-05, + "loss": 0.9943, + "mean_token_accuracy": 0.7025649309158325, + "num_tokens": 236961731.0, + "step": 96160 + }, + { + "epoch": 0.8817273310717888, + "learning_rate": 2.3656367470431835e-05, + "loss": 0.973, + "mean_token_accuracy": 0.7142005324363708, + "num_tokens": 236990347.0, + "step": 96170 + }, + { + "epoch": 0.8818190153112679, + "learning_rate": 2.3638030622535987e-05, + "loss": 0.9471, + "mean_token_accuracy": 0.7102129638195038, + "num_tokens": 237017421.0, + "step": 96180 + }, + { + "epoch": 0.8819106995507472, + "learning_rate": 2.361969377464014e-05, + "loss": 0.9288, + "mean_token_accuracy": 0.721216493844986, + "num_tokens": 237045388.0, + "step": 96190 + }, + { + "epoch": 0.8820023837902264, + "learning_rate": 2.3601356926744294e-05, + "loss": 0.9711, + "mean_token_accuracy": 0.707420414686203, + "num_tokens": 237073012.0, + "step": 96200 + }, + { + "epoch": 0.8820940680297057, + "learning_rate": 2.3583020078848446e-05, + "loss": 0.9903, + "mean_token_accuracy": 0.7036702990531921, + "num_tokens": 237102049.0, + "step": 96210 + }, + { + "epoch": 0.8821857522691849, + "learning_rate": 2.35646832309526e-05, + "loss": 0.9678, + "mean_token_accuracy": 0.7045400202274322, + "num_tokens": 237130406.0, + "step": 96220 + }, + { + "epoch": 0.8822774365086642, + "learning_rate": 2.3546346383056753e-05, + "loss": 0.9807, + "mean_token_accuracy": 0.7066488981246948, + "num_tokens": 237158095.0, + "step": 96230 + }, + { + "epoch": 0.8823691207481434, + "learning_rate": 2.352800953516091e-05, + "loss": 0.9539, + "mean_token_accuracy": 0.7105531454086303, + "num_tokens": 237185653.0, + "step": 96240 + }, + { + "epoch": 0.8824608049876226, + "learning_rate": 2.350967268726506e-05, + "loss": 0.9699, + "mean_token_accuracy": 0.7080231070518493, + "num_tokens": 237214270.0, + "step": 96250 + }, + { + "epoch": 0.8825524892271018, + "learning_rate": 2.3491335839369212e-05, + "loss": 0.9723, + "mean_token_accuracy": 0.7070541739463806, + "num_tokens": 237243048.0, + "step": 96260 + }, + { + "epoch": 0.8826441734665811, + "learning_rate": 2.3472998991473368e-05, + "loss": 0.983, + "mean_token_accuracy": 0.7049121856689453, + "num_tokens": 237271063.0, + "step": 96270 + }, + { + "epoch": 0.8827358577060603, + "learning_rate": 2.345466214357752e-05, + "loss": 0.9831, + "mean_token_accuracy": 0.7061281263828277, + "num_tokens": 237299560.0, + "step": 96280 + }, + { + "epoch": 0.8828275419455396, + "learning_rate": 2.3436325295681675e-05, + "loss": 0.9732, + "mean_token_accuracy": 0.7040581047534943, + "num_tokens": 237328309.0, + "step": 96290 + }, + { + "epoch": 0.8829192261850188, + "learning_rate": 2.3417988447785827e-05, + "loss": 0.9618, + "mean_token_accuracy": 0.7013525426387787, + "num_tokens": 237356287.0, + "step": 96300 + }, + { + "epoch": 0.883010910424498, + "learning_rate": 2.339965159988998e-05, + "loss": 0.965, + "mean_token_accuracy": 0.7045096695423126, + "num_tokens": 237385418.0, + "step": 96310 + }, + { + "epoch": 0.8831025946639772, + "learning_rate": 2.3381314751994134e-05, + "loss": 0.9748, + "mean_token_accuracy": 0.702563327550888, + "num_tokens": 237413924.0, + "step": 96320 + }, + { + "epoch": 0.8831942789034565, + "learning_rate": 2.336297790409829e-05, + "loss": 0.9521, + "mean_token_accuracy": 0.7084671258926392, + "num_tokens": 237441379.0, + "step": 96330 + }, + { + "epoch": 0.8832859631429357, + "learning_rate": 2.334464105620244e-05, + "loss": 0.9728, + "mean_token_accuracy": 0.7088446319103241, + "num_tokens": 237469444.0, + "step": 96340 + }, + { + "epoch": 0.883377647382415, + "learning_rate": 2.3326304208306593e-05, + "loss": 0.9826, + "mean_token_accuracy": 0.7064197480678558, + "num_tokens": 237498444.0, + "step": 96350 + }, + { + "epoch": 0.8834693316218942, + "learning_rate": 2.3307967360410745e-05, + "loss": 0.9819, + "mean_token_accuracy": 0.7058658063411712, + "num_tokens": 237526235.0, + "step": 96360 + }, + { + "epoch": 0.8835610158613735, + "learning_rate": 2.32896305125149e-05, + "loss": 0.9749, + "mean_token_accuracy": 0.7051710247993469, + "num_tokens": 237554660.0, + "step": 96370 + }, + { + "epoch": 0.8836527001008526, + "learning_rate": 2.3271293664619055e-05, + "loss": 0.9958, + "mean_token_accuracy": 0.7004640519618988, + "num_tokens": 237583348.0, + "step": 96380 + }, + { + "epoch": 0.8837443843403319, + "learning_rate": 2.3252956816723207e-05, + "loss": 0.9699, + "mean_token_accuracy": 0.7076722145080566, + "num_tokens": 237611774.0, + "step": 96390 + }, + { + "epoch": 0.8838360685798111, + "learning_rate": 2.323461996882736e-05, + "loss": 0.9714, + "mean_token_accuracy": 0.7071040511131287, + "num_tokens": 237640235.0, + "step": 96400 + }, + { + "epoch": 0.8839277528192904, + "learning_rate": 2.321628312093151e-05, + "loss": 0.9497, + "mean_token_accuracy": 0.7125555276870728, + "num_tokens": 237669710.0, + "step": 96410 + }, + { + "epoch": 0.8840194370587696, + "learning_rate": 2.3197946273035666e-05, + "loss": 0.9396, + "mean_token_accuracy": 0.7129753589630127, + "num_tokens": 237697698.0, + "step": 96420 + }, + { + "epoch": 0.8841111212982489, + "learning_rate": 2.317960942513982e-05, + "loss": 1.0042, + "mean_token_accuracy": 0.7032662093639374, + "num_tokens": 237726235.0, + "step": 96430 + }, + { + "epoch": 0.884202805537728, + "learning_rate": 2.3161272577243973e-05, + "loss": 0.9517, + "mean_token_accuracy": 0.7114958107471466, + "num_tokens": 237754077.0, + "step": 96440 + }, + { + "epoch": 0.8842944897772073, + "learning_rate": 2.3142935729348125e-05, + "loss": 0.9631, + "mean_token_accuracy": 0.7093418061733245, + "num_tokens": 237782454.0, + "step": 96450 + }, + { + "epoch": 0.8843861740166865, + "learning_rate": 2.312459888145228e-05, + "loss": 0.9837, + "mean_token_accuracy": 0.7035586893558502, + "num_tokens": 237810900.0, + "step": 96460 + }, + { + "epoch": 0.8844778582561658, + "learning_rate": 2.3106262033556432e-05, + "loss": 0.9725, + "mean_token_accuracy": 0.7076469600200653, + "num_tokens": 237839366.0, + "step": 96470 + }, + { + "epoch": 0.884569542495645, + "learning_rate": 2.3087925185660587e-05, + "loss": 0.9594, + "mean_token_accuracy": 0.7062601745128632, + "num_tokens": 237867267.0, + "step": 96480 + }, + { + "epoch": 0.8846612267351243, + "learning_rate": 2.306958833776474e-05, + "loss": 0.9869, + "mean_token_accuracy": 0.704833859205246, + "num_tokens": 237896233.0, + "step": 96490 + }, + { + "epoch": 0.8847529109746035, + "learning_rate": 2.305125148986889e-05, + "loss": 0.9797, + "mean_token_accuracy": 0.7050725817680359, + "num_tokens": 237924634.0, + "step": 96500 + }, + { + "epoch": 0.8848445952140827, + "learning_rate": 2.3032914641973046e-05, + "loss": 0.9679, + "mean_token_accuracy": 0.7066472947597504, + "num_tokens": 237953567.0, + "step": 96510 + }, + { + "epoch": 0.8849362794535619, + "learning_rate": 2.3014577794077198e-05, + "loss": 0.9672, + "mean_token_accuracy": 0.7009207725524902, + "num_tokens": 237981852.0, + "step": 96520 + }, + { + "epoch": 0.8850279636930412, + "learning_rate": 2.2996240946181353e-05, + "loss": 0.9553, + "mean_token_accuracy": 0.7090889692306519, + "num_tokens": 238009713.0, + "step": 96530 + }, + { + "epoch": 0.8851196479325204, + "learning_rate": 2.2977904098285505e-05, + "loss": 1.0145, + "mean_token_accuracy": 0.6924037039279938, + "num_tokens": 238037679.0, + "step": 96540 + }, + { + "epoch": 0.8852113321719997, + "learning_rate": 2.295956725038966e-05, + "loss": 0.9701, + "mean_token_accuracy": 0.7095661163330078, + "num_tokens": 238065350.0, + "step": 96550 + }, + { + "epoch": 0.8853030164114789, + "learning_rate": 2.2941230402493812e-05, + "loss": 0.9667, + "mean_token_accuracy": 0.7087648987770081, + "num_tokens": 238094915.0, + "step": 96560 + }, + { + "epoch": 0.8853947006509582, + "learning_rate": 2.2922893554597964e-05, + "loss": 0.9943, + "mean_token_accuracy": 0.7007356286048889, + "num_tokens": 238123245.0, + "step": 96570 + }, + { + "epoch": 0.8854863848904373, + "learning_rate": 2.290455670670212e-05, + "loss": 0.9883, + "mean_token_accuracy": 0.707362300157547, + "num_tokens": 238151699.0, + "step": 96580 + }, + { + "epoch": 0.8855780691299165, + "learning_rate": 2.288621985880627e-05, + "loss": 0.9578, + "mean_token_accuracy": 0.7084274351596832, + "num_tokens": 238179378.0, + "step": 96590 + }, + { + "epoch": 0.8856697533693958, + "learning_rate": 2.2867883010910427e-05, + "loss": 0.9346, + "mean_token_accuracy": 0.7091085612773895, + "num_tokens": 238206805.0, + "step": 96600 + }, + { + "epoch": 0.885761437608875, + "learning_rate": 2.284954616301458e-05, + "loss": 0.9826, + "mean_token_accuracy": 0.7047915995121002, + "num_tokens": 238235084.0, + "step": 96610 + }, + { + "epoch": 0.8858531218483543, + "learning_rate": 2.283120931511873e-05, + "loss": 0.9923, + "mean_token_accuracy": 0.7035689234733582, + "num_tokens": 238263579.0, + "step": 96620 + }, + { + "epoch": 0.8859448060878335, + "learning_rate": 2.2812872467222886e-05, + "loss": 0.97, + "mean_token_accuracy": 0.7095637738704681, + "num_tokens": 238291103.0, + "step": 96630 + }, + { + "epoch": 0.8860364903273127, + "learning_rate": 2.279453561932704e-05, + "loss": 0.9359, + "mean_token_accuracy": 0.7145771861076355, + "num_tokens": 238318154.0, + "step": 96640 + }, + { + "epoch": 0.8861281745667919, + "learning_rate": 2.2776198771431193e-05, + "loss": 0.9982, + "mean_token_accuracy": 0.6963150262832641, + "num_tokens": 238345981.0, + "step": 96650 + }, + { + "epoch": 0.8862198588062712, + "learning_rate": 2.2757861923535345e-05, + "loss": 0.924, + "mean_token_accuracy": 0.7200303912162781, + "num_tokens": 238374039.0, + "step": 96660 + }, + { + "epoch": 0.8863115430457504, + "learning_rate": 2.2739525075639496e-05, + "loss": 0.9494, + "mean_token_accuracy": 0.7126326620578766, + "num_tokens": 238401339.0, + "step": 96670 + }, + { + "epoch": 0.8864032272852297, + "learning_rate": 2.2721188227743652e-05, + "loss": 0.9689, + "mean_token_accuracy": 0.7026102662086486, + "num_tokens": 238429213.0, + "step": 96680 + }, + { + "epoch": 0.8864949115247089, + "learning_rate": 2.2702851379847807e-05, + "loss": 0.9732, + "mean_token_accuracy": 0.7079392790794372, + "num_tokens": 238458508.0, + "step": 96690 + }, + { + "epoch": 0.8865865957641882, + "learning_rate": 2.268451453195196e-05, + "loss": 0.9415, + "mean_token_accuracy": 0.7129162967205047, + "num_tokens": 238486420.0, + "step": 96700 + }, + { + "epoch": 0.8866782800036673, + "learning_rate": 2.266617768405611e-05, + "loss": 0.9727, + "mean_token_accuracy": 0.7034138381481171, + "num_tokens": 238514631.0, + "step": 96710 + }, + { + "epoch": 0.8867699642431466, + "learning_rate": 2.2647840836160263e-05, + "loss": 0.9675, + "mean_token_accuracy": 0.7059114933013916, + "num_tokens": 238543042.0, + "step": 96720 + }, + { + "epoch": 0.8868616484826258, + "learning_rate": 2.2629503988264418e-05, + "loss": 0.9776, + "mean_token_accuracy": 0.7054970860481262, + "num_tokens": 238571414.0, + "step": 96730 + }, + { + "epoch": 0.8869533327221051, + "learning_rate": 2.2611167140368573e-05, + "loss": 0.9637, + "mean_token_accuracy": 0.7084570229053497, + "num_tokens": 238599175.0, + "step": 96740 + }, + { + "epoch": 0.8870450169615843, + "learning_rate": 2.2592830292472725e-05, + "loss": 0.9901, + "mean_token_accuracy": 0.7020326614379883, + "num_tokens": 238626897.0, + "step": 96750 + }, + { + "epoch": 0.8871367012010636, + "learning_rate": 2.2574493444576877e-05, + "loss": 0.9427, + "mean_token_accuracy": 0.7104795098304748, + "num_tokens": 238655498.0, + "step": 96760 + }, + { + "epoch": 0.8872283854405427, + "learning_rate": 2.2556156596681032e-05, + "loss": 0.9625, + "mean_token_accuracy": 0.710882818698883, + "num_tokens": 238684165.0, + "step": 96770 + }, + { + "epoch": 0.887320069680022, + "learning_rate": 2.2537819748785184e-05, + "loss": 0.9437, + "mean_token_accuracy": 0.7077939689159394, + "num_tokens": 238712287.0, + "step": 96780 + }, + { + "epoch": 0.8874117539195012, + "learning_rate": 2.251948290088934e-05, + "loss": 0.9751, + "mean_token_accuracy": 0.7079537868499756, + "num_tokens": 238741552.0, + "step": 96790 + }, + { + "epoch": 0.8875034381589805, + "learning_rate": 2.250114605299349e-05, + "loss": 0.9492, + "mean_token_accuracy": 0.7128849506378174, + "num_tokens": 238769951.0, + "step": 96800 + }, + { + "epoch": 0.8875951223984597, + "learning_rate": 2.2482809205097643e-05, + "loss": 0.9676, + "mean_token_accuracy": 0.7078661918640137, + "num_tokens": 238798496.0, + "step": 96810 + }, + { + "epoch": 0.887686806637939, + "learning_rate": 2.2464472357201798e-05, + "loss": 0.9743, + "mean_token_accuracy": 0.705557507276535, + "num_tokens": 238827458.0, + "step": 96820 + }, + { + "epoch": 0.8877784908774182, + "learning_rate": 2.244613550930595e-05, + "loss": 0.9806, + "mean_token_accuracy": 0.7007512450218201, + "num_tokens": 238856477.0, + "step": 96830 + }, + { + "epoch": 0.8878701751168974, + "learning_rate": 2.2427798661410105e-05, + "loss": 0.9746, + "mean_token_accuracy": 0.7021511018276214, + "num_tokens": 238884243.0, + "step": 96840 + }, + { + "epoch": 0.8879618593563766, + "learning_rate": 2.2409461813514257e-05, + "loss": 0.9804, + "mean_token_accuracy": 0.703189742565155, + "num_tokens": 238912612.0, + "step": 96850 + }, + { + "epoch": 0.8880535435958559, + "learning_rate": 2.2391124965618412e-05, + "loss": 0.9405, + "mean_token_accuracy": 0.7142318785190582, + "num_tokens": 238940807.0, + "step": 96860 + }, + { + "epoch": 0.8881452278353351, + "learning_rate": 2.2372788117722564e-05, + "loss": 0.9313, + "mean_token_accuracy": 0.7137115716934204, + "num_tokens": 238968612.0, + "step": 96870 + }, + { + "epoch": 0.8882369120748144, + "learning_rate": 2.2354451269826716e-05, + "loss": 0.9161, + "mean_token_accuracy": 0.7169967651367187, + "num_tokens": 238996205.0, + "step": 96880 + }, + { + "epoch": 0.8883285963142936, + "learning_rate": 2.233611442193087e-05, + "loss": 0.9827, + "mean_token_accuracy": 0.7005254030227661, + "num_tokens": 239024865.0, + "step": 96890 + }, + { + "epoch": 0.8884202805537728, + "learning_rate": 2.2317777574035023e-05, + "loss": 0.9743, + "mean_token_accuracy": 0.7017959892749787, + "num_tokens": 239053388.0, + "step": 96900 + }, + { + "epoch": 0.888511964793252, + "learning_rate": 2.229944072613918e-05, + "loss": 0.9964, + "mean_token_accuracy": 0.7043148577213287, + "num_tokens": 239082342.0, + "step": 96910 + }, + { + "epoch": 0.8886036490327313, + "learning_rate": 2.228110387824333e-05, + "loss": 0.9737, + "mean_token_accuracy": 0.702905124425888, + "num_tokens": 239111159.0, + "step": 96920 + }, + { + "epoch": 0.8886953332722105, + "learning_rate": 2.2262767030347482e-05, + "loss": 0.9568, + "mean_token_accuracy": 0.706221753358841, + "num_tokens": 239140197.0, + "step": 96930 + }, + { + "epoch": 0.8887870175116898, + "learning_rate": 2.2244430182451638e-05, + "loss": 0.9881, + "mean_token_accuracy": 0.7017104625701904, + "num_tokens": 239168682.0, + "step": 96940 + }, + { + "epoch": 0.888878701751169, + "learning_rate": 2.2226093334555793e-05, + "loss": 0.9631, + "mean_token_accuracy": 0.7079795181751252, + "num_tokens": 239197190.0, + "step": 96950 + }, + { + "epoch": 0.8889703859906483, + "learning_rate": 2.2207756486659945e-05, + "loss": 0.9418, + "mean_token_accuracy": 0.7149965763092041, + "num_tokens": 239224099.0, + "step": 96960 + }, + { + "epoch": 0.8890620702301274, + "learning_rate": 2.2189419638764097e-05, + "loss": 0.9304, + "mean_token_accuracy": 0.7135801434516906, + "num_tokens": 239252220.0, + "step": 96970 + }, + { + "epoch": 0.8891537544696066, + "learning_rate": 2.217108279086825e-05, + "loss": 0.9858, + "mean_token_accuracy": 0.7067170798778534, + "num_tokens": 239280284.0, + "step": 96980 + }, + { + "epoch": 0.8892454387090859, + "learning_rate": 2.2152745942972407e-05, + "loss": 0.9569, + "mean_token_accuracy": 0.709110152721405, + "num_tokens": 239307859.0, + "step": 96990 + }, + { + "epoch": 0.8893371229485652, + "learning_rate": 2.213440909507656e-05, + "loss": 0.9806, + "mean_token_accuracy": 0.7043768763542175, + "num_tokens": 239336514.0, + "step": 97000 + }, + { + "epoch": 0.8894288071880444, + "learning_rate": 2.211607224718071e-05, + "loss": 0.9746, + "mean_token_accuracy": 0.7031792461872101, + "num_tokens": 239365349.0, + "step": 97010 + }, + { + "epoch": 0.8895204914275237, + "learning_rate": 2.2097735399284863e-05, + "loss": 0.9405, + "mean_token_accuracy": 0.7163421332836151, + "num_tokens": 239393319.0, + "step": 97020 + }, + { + "epoch": 0.8896121756670028, + "learning_rate": 2.2079398551389015e-05, + "loss": 0.9584, + "mean_token_accuracy": 0.7097893059253693, + "num_tokens": 239420833.0, + "step": 97030 + }, + { + "epoch": 0.889703859906482, + "learning_rate": 2.2061061703493173e-05, + "loss": 0.963, + "mean_token_accuracy": 0.7110153555870056, + "num_tokens": 239448339.0, + "step": 97040 + }, + { + "epoch": 0.8897955441459613, + "learning_rate": 2.2042724855597325e-05, + "loss": 0.9649, + "mean_token_accuracy": 0.7093183338642121, + "num_tokens": 239476061.0, + "step": 97050 + }, + { + "epoch": 0.8898872283854405, + "learning_rate": 2.2024388007701477e-05, + "loss": 0.9976, + "mean_token_accuracy": 0.7013116657733918, + "num_tokens": 239503886.0, + "step": 97060 + }, + { + "epoch": 0.8899789126249198, + "learning_rate": 2.200605115980563e-05, + "loss": 0.9559, + "mean_token_accuracy": 0.7107174158096313, + "num_tokens": 239531527.0, + "step": 97070 + }, + { + "epoch": 0.890070596864399, + "learning_rate": 2.1987714311909784e-05, + "loss": 0.9431, + "mean_token_accuracy": 0.713870745897293, + "num_tokens": 239558029.0, + "step": 97080 + }, + { + "epoch": 0.8901622811038783, + "learning_rate": 2.196937746401394e-05, + "loss": 0.9742, + "mean_token_accuracy": 0.7022699773311615, + "num_tokens": 239586449.0, + "step": 97090 + }, + { + "epoch": 0.8902539653433574, + "learning_rate": 2.195104061611809e-05, + "loss": 0.9516, + "mean_token_accuracy": 0.7131372094154358, + "num_tokens": 239614337.0, + "step": 97100 + }, + { + "epoch": 0.8903456495828367, + "learning_rate": 2.1932703768222243e-05, + "loss": 0.9785, + "mean_token_accuracy": 0.7015217185020447, + "num_tokens": 239640820.0, + "step": 97110 + }, + { + "epoch": 0.8904373338223159, + "learning_rate": 2.1914366920326395e-05, + "loss": 0.9467, + "mean_token_accuracy": 0.7167421400547027, + "num_tokens": 239669059.0, + "step": 97120 + }, + { + "epoch": 0.8905290180617952, + "learning_rate": 2.189603007243055e-05, + "loss": 0.9918, + "mean_token_accuracy": 0.7034554660320282, + "num_tokens": 239697143.0, + "step": 97130 + }, + { + "epoch": 0.8906207023012744, + "learning_rate": 2.1877693224534705e-05, + "loss": 0.9442, + "mean_token_accuracy": 0.7145998239517212, + "num_tokens": 239725341.0, + "step": 97140 + }, + { + "epoch": 0.8907123865407537, + "learning_rate": 2.1859356376638857e-05, + "loss": 0.9939, + "mean_token_accuracy": 0.7020884215831756, + "num_tokens": 239753977.0, + "step": 97150 + }, + { + "epoch": 0.8908040707802328, + "learning_rate": 2.184101952874301e-05, + "loss": 0.934, + "mean_token_accuracy": 0.718560802936554, + "num_tokens": 239780901.0, + "step": 97160 + }, + { + "epoch": 0.8908957550197121, + "learning_rate": 2.1822682680847164e-05, + "loss": 0.9922, + "mean_token_accuracy": 0.7035746157169342, + "num_tokens": 239808979.0, + "step": 97170 + }, + { + "epoch": 0.8909874392591913, + "learning_rate": 2.1804345832951316e-05, + "loss": 0.9862, + "mean_token_accuracy": 0.702910327911377, + "num_tokens": 239837834.0, + "step": 97180 + }, + { + "epoch": 0.8910791234986706, + "learning_rate": 2.178600898505547e-05, + "loss": 0.9433, + "mean_token_accuracy": 0.7108165144920349, + "num_tokens": 239865397.0, + "step": 97190 + }, + { + "epoch": 0.8911708077381498, + "learning_rate": 2.1767672137159623e-05, + "loss": 0.9445, + "mean_token_accuracy": 0.7101834297180176, + "num_tokens": 239893456.0, + "step": 97200 + }, + { + "epoch": 0.8912624919776291, + "learning_rate": 2.1749335289263775e-05, + "loss": 0.9576, + "mean_token_accuracy": 0.7073729932308197, + "num_tokens": 239921202.0, + "step": 97210 + }, + { + "epoch": 0.8913541762171083, + "learning_rate": 2.173099844136793e-05, + "loss": 0.9374, + "mean_token_accuracy": 0.7145473480224609, + "num_tokens": 239949475.0, + "step": 97220 + }, + { + "epoch": 0.8914458604565875, + "learning_rate": 2.1712661593472082e-05, + "loss": 0.9846, + "mean_token_accuracy": 0.7072529911994934, + "num_tokens": 239977541.0, + "step": 97230 + }, + { + "epoch": 0.8915375446960667, + "learning_rate": 2.1694324745576238e-05, + "loss": 0.9614, + "mean_token_accuracy": 0.70999316573143, + "num_tokens": 240004967.0, + "step": 97240 + }, + { + "epoch": 0.891629228935546, + "learning_rate": 2.167598789768039e-05, + "loss": 0.9391, + "mean_token_accuracy": 0.7105208516120911, + "num_tokens": 240033137.0, + "step": 97250 + }, + { + "epoch": 0.8917209131750252, + "learning_rate": 2.1657651049784545e-05, + "loss": 0.9743, + "mean_token_accuracy": 0.7062634706497193, + "num_tokens": 240060370.0, + "step": 97260 + }, + { + "epoch": 0.8918125974145045, + "learning_rate": 2.1639314201888697e-05, + "loss": 0.9827, + "mean_token_accuracy": 0.7027591407299042, + "num_tokens": 240088910.0, + "step": 97270 + }, + { + "epoch": 0.8919042816539837, + "learning_rate": 2.162097735399285e-05, + "loss": 0.951, + "mean_token_accuracy": 0.7139334440231323, + "num_tokens": 240116855.0, + "step": 97280 + }, + { + "epoch": 0.8919959658934629, + "learning_rate": 2.1602640506097004e-05, + "loss": 0.9578, + "mean_token_accuracy": 0.711462140083313, + "num_tokens": 240144392.0, + "step": 97290 + }, + { + "epoch": 0.8920876501329421, + "learning_rate": 2.158430365820116e-05, + "loss": 0.9811, + "mean_token_accuracy": 0.7059013426303864, + "num_tokens": 240171591.0, + "step": 97300 + }, + { + "epoch": 0.8921793343724214, + "learning_rate": 2.156596681030531e-05, + "loss": 0.9846, + "mean_token_accuracy": 0.70493643283844, + "num_tokens": 240199999.0, + "step": 97310 + }, + { + "epoch": 0.8922710186119006, + "learning_rate": 2.1547629962409463e-05, + "loss": 0.9725, + "mean_token_accuracy": 0.7052574157714844, + "num_tokens": 240228436.0, + "step": 97320 + }, + { + "epoch": 0.8923627028513799, + "learning_rate": 2.1529293114513615e-05, + "loss": 0.9705, + "mean_token_accuracy": 0.710043752193451, + "num_tokens": 240255741.0, + "step": 97330 + }, + { + "epoch": 0.8924543870908591, + "learning_rate": 2.151095626661777e-05, + "loss": 0.9806, + "mean_token_accuracy": 0.7028496623039245, + "num_tokens": 240284504.0, + "step": 97340 + }, + { + "epoch": 0.8925460713303384, + "learning_rate": 2.1492619418721925e-05, + "loss": 0.9851, + "mean_token_accuracy": 0.7029170513153076, + "num_tokens": 240313451.0, + "step": 97350 + }, + { + "epoch": 0.8926377555698175, + "learning_rate": 2.1474282570826077e-05, + "loss": 0.9343, + "mean_token_accuracy": 0.71030895113945, + "num_tokens": 240341868.0, + "step": 97360 + }, + { + "epoch": 0.8927294398092968, + "learning_rate": 2.145594572293023e-05, + "loss": 0.9954, + "mean_token_accuracy": 0.7004880666732788, + "num_tokens": 240369515.0, + "step": 97370 + }, + { + "epoch": 0.892821124048776, + "learning_rate": 2.143760887503438e-05, + "loss": 0.9662, + "mean_token_accuracy": 0.7119122266769409, + "num_tokens": 240398227.0, + "step": 97380 + }, + { + "epoch": 0.8929128082882553, + "learning_rate": 2.1419272027138536e-05, + "loss": 0.9702, + "mean_token_accuracy": 0.7040501415729523, + "num_tokens": 240426108.0, + "step": 97390 + }, + { + "epoch": 0.8930044925277345, + "learning_rate": 2.140093517924269e-05, + "loss": 0.9702, + "mean_token_accuracy": 0.7058905005455017, + "num_tokens": 240454373.0, + "step": 97400 + }, + { + "epoch": 0.8930961767672138, + "learning_rate": 2.1382598331346843e-05, + "loss": 0.9967, + "mean_token_accuracy": 0.6971623063087463, + "num_tokens": 240483144.0, + "step": 97410 + }, + { + "epoch": 0.8931878610066929, + "learning_rate": 2.1364261483450995e-05, + "loss": 0.9838, + "mean_token_accuracy": 0.7018255293369293, + "num_tokens": 240510562.0, + "step": 97420 + }, + { + "epoch": 0.8932795452461721, + "learning_rate": 2.1345924635555147e-05, + "loss": 0.9558, + "mean_token_accuracy": 0.7107691287994384, + "num_tokens": 240539387.0, + "step": 97430 + }, + { + "epoch": 0.8933712294856514, + "learning_rate": 2.1327587787659302e-05, + "loss": 0.9911, + "mean_token_accuracy": 0.7008166253566742, + "num_tokens": 240566876.0, + "step": 97440 + }, + { + "epoch": 0.8934629137251306, + "learning_rate": 2.1309250939763457e-05, + "loss": 0.9847, + "mean_token_accuracy": 0.7042464196681977, + "num_tokens": 240594001.0, + "step": 97450 + }, + { + "epoch": 0.8935545979646099, + "learning_rate": 2.129091409186761e-05, + "loss": 0.9485, + "mean_token_accuracy": 0.7077670335769654, + "num_tokens": 240621941.0, + "step": 97460 + }, + { + "epoch": 0.8936462822040891, + "learning_rate": 2.127257724397176e-05, + "loss": 0.9822, + "mean_token_accuracy": 0.7049382746219635, + "num_tokens": 240649252.0, + "step": 97470 + }, + { + "epoch": 0.8937379664435684, + "learning_rate": 2.1254240396075916e-05, + "loss": 0.9271, + "mean_token_accuracy": 0.7190112054347992, + "num_tokens": 240676809.0, + "step": 97480 + }, + { + "epoch": 0.8938296506830475, + "learning_rate": 2.1235903548180068e-05, + "loss": 0.9588, + "mean_token_accuracy": 0.7135937631130218, + "num_tokens": 240705868.0, + "step": 97490 + }, + { + "epoch": 0.8939213349225268, + "learning_rate": 2.1217566700284223e-05, + "loss": 0.976, + "mean_token_accuracy": 0.7038445949554444, + "num_tokens": 240733608.0, + "step": 97500 + }, + { + "epoch": 0.894013019162006, + "learning_rate": 2.1199229852388375e-05, + "loss": 0.9703, + "mean_token_accuracy": 0.7072181105613708, + "num_tokens": 240762169.0, + "step": 97510 + }, + { + "epoch": 0.8941047034014853, + "learning_rate": 2.1180893004492527e-05, + "loss": 0.9749, + "mean_token_accuracy": 0.7093082249164582, + "num_tokens": 240790284.0, + "step": 97520 + }, + { + "epoch": 0.8941963876409645, + "learning_rate": 2.1162556156596682e-05, + "loss": 0.9496, + "mean_token_accuracy": 0.7182524740695954, + "num_tokens": 240818279.0, + "step": 97530 + }, + { + "epoch": 0.8942880718804438, + "learning_rate": 2.1144219308700834e-05, + "loss": 0.9908, + "mean_token_accuracy": 0.7036314368247986, + "num_tokens": 240846334.0, + "step": 97540 + }, + { + "epoch": 0.8943797561199229, + "learning_rate": 2.112588246080499e-05, + "loss": 0.9266, + "mean_token_accuracy": 0.7167088270187378, + "num_tokens": 240874300.0, + "step": 97550 + }, + { + "epoch": 0.8944714403594022, + "learning_rate": 2.110754561290914e-05, + "loss": 0.9477, + "mean_token_accuracy": 0.7165841042995453, + "num_tokens": 240901484.0, + "step": 97560 + }, + { + "epoch": 0.8945631245988814, + "learning_rate": 2.1089208765013297e-05, + "loss": 0.9992, + "mean_token_accuracy": 0.704637223482132, + "num_tokens": 240930147.0, + "step": 97570 + }, + { + "epoch": 0.8946548088383607, + "learning_rate": 2.107087191711745e-05, + "loss": 0.9664, + "mean_token_accuracy": 0.7051290452480317, + "num_tokens": 240958434.0, + "step": 97580 + }, + { + "epoch": 0.8947464930778399, + "learning_rate": 2.10525350692216e-05, + "loss": 0.9558, + "mean_token_accuracy": 0.7086008548736572, + "num_tokens": 240986338.0, + "step": 97590 + }, + { + "epoch": 0.8948381773173192, + "learning_rate": 2.1034198221325756e-05, + "loss": 0.9603, + "mean_token_accuracy": 0.705905967950821, + "num_tokens": 241014936.0, + "step": 97600 + }, + { + "epoch": 0.8949298615567984, + "learning_rate": 2.1015861373429908e-05, + "loss": 0.9688, + "mean_token_accuracy": 0.7053589344024658, + "num_tokens": 241041784.0, + "step": 97610 + }, + { + "epoch": 0.8950215457962776, + "learning_rate": 2.0997524525534063e-05, + "loss": 0.9545, + "mean_token_accuracy": 0.707834267616272, + "num_tokens": 241069063.0, + "step": 97620 + }, + { + "epoch": 0.8951132300357568, + "learning_rate": 2.0979187677638215e-05, + "loss": 1.0178, + "mean_token_accuracy": 0.6941853821277618, + "num_tokens": 241097606.0, + "step": 97630 + }, + { + "epoch": 0.8952049142752361, + "learning_rate": 2.0960850829742367e-05, + "loss": 0.9389, + "mean_token_accuracy": 0.7142586946487427, + "num_tokens": 241125382.0, + "step": 97640 + }, + { + "epoch": 0.8952965985147153, + "learning_rate": 2.0942513981846522e-05, + "loss": 0.9715, + "mean_token_accuracy": 0.704793119430542, + "num_tokens": 241152699.0, + "step": 97650 + }, + { + "epoch": 0.8953882827541946, + "learning_rate": 2.0924177133950677e-05, + "loss": 0.9581, + "mean_token_accuracy": 0.7088997960090637, + "num_tokens": 241181195.0, + "step": 97660 + }, + { + "epoch": 0.8954799669936738, + "learning_rate": 2.090584028605483e-05, + "loss": 0.9943, + "mean_token_accuracy": 0.7021056711673737, + "num_tokens": 241209766.0, + "step": 97670 + }, + { + "epoch": 0.895571651233153, + "learning_rate": 2.088750343815898e-05, + "loss": 0.9612, + "mean_token_accuracy": 0.7067963480949402, + "num_tokens": 241237038.0, + "step": 97680 + }, + { + "epoch": 0.8956633354726322, + "learning_rate": 2.0869166590263133e-05, + "loss": 0.9515, + "mean_token_accuracy": 0.7101170957088471, + "num_tokens": 241265491.0, + "step": 97690 + }, + { + "epoch": 0.8957550197121115, + "learning_rate": 2.0850829742367288e-05, + "loss": 0.9481, + "mean_token_accuracy": 0.7074155569076538, + "num_tokens": 241292131.0, + "step": 97700 + }, + { + "epoch": 0.8958467039515907, + "learning_rate": 2.0832492894471443e-05, + "loss": 0.9605, + "mean_token_accuracy": 0.7086700677871705, + "num_tokens": 241319995.0, + "step": 97710 + }, + { + "epoch": 0.89593838819107, + "learning_rate": 2.0814156046575595e-05, + "loss": 0.9693, + "mean_token_accuracy": 0.7046679139137269, + "num_tokens": 241347349.0, + "step": 97720 + }, + { + "epoch": 0.8960300724305492, + "learning_rate": 2.0795819198679747e-05, + "loss": 0.9346, + "mean_token_accuracy": 0.7158856809139251, + "num_tokens": 241374999.0, + "step": 97730 + }, + { + "epoch": 0.8961217566700285, + "learning_rate": 2.07774823507839e-05, + "loss": 0.9811, + "mean_token_accuracy": 0.7040074944496155, + "num_tokens": 241402937.0, + "step": 97740 + }, + { + "epoch": 0.8962134409095076, + "learning_rate": 2.0759145502888054e-05, + "loss": 0.961, + "mean_token_accuracy": 0.7127393186092377, + "num_tokens": 241431821.0, + "step": 97750 + }, + { + "epoch": 0.8963051251489869, + "learning_rate": 2.074080865499221e-05, + "loss": 0.9859, + "mean_token_accuracy": 0.702030336856842, + "num_tokens": 241460322.0, + "step": 97760 + }, + { + "epoch": 0.8963968093884661, + "learning_rate": 2.072247180709636e-05, + "loss": 0.9521, + "mean_token_accuracy": 0.7114170610904693, + "num_tokens": 241487720.0, + "step": 97770 + }, + { + "epoch": 0.8964884936279454, + "learning_rate": 2.0704134959200513e-05, + "loss": 0.9699, + "mean_token_accuracy": 0.7097540855407715, + "num_tokens": 241515097.0, + "step": 97780 + }, + { + "epoch": 0.8965801778674246, + "learning_rate": 2.0685798111304668e-05, + "loss": 0.9837, + "mean_token_accuracy": 0.7047342956066132, + "num_tokens": 241543472.0, + "step": 97790 + }, + { + "epoch": 0.8966718621069039, + "learning_rate": 2.066746126340882e-05, + "loss": 0.9605, + "mean_token_accuracy": 0.7147351503372192, + "num_tokens": 241571616.0, + "step": 97800 + }, + { + "epoch": 0.8967635463463831, + "learning_rate": 2.0649124415512975e-05, + "loss": 0.9441, + "mean_token_accuracy": 0.7077078938484191, + "num_tokens": 241600183.0, + "step": 97810 + }, + { + "epoch": 0.8968552305858623, + "learning_rate": 2.0630787567617127e-05, + "loss": 0.9806, + "mean_token_accuracy": 0.7040668785572052, + "num_tokens": 241627875.0, + "step": 97820 + }, + { + "epoch": 0.8969469148253415, + "learning_rate": 2.061245071972128e-05, + "loss": 0.9481, + "mean_token_accuracy": 0.7153401970863342, + "num_tokens": 241655914.0, + "step": 97830 + }, + { + "epoch": 0.8970385990648208, + "learning_rate": 2.0594113871825434e-05, + "loss": 0.9467, + "mean_token_accuracy": 0.7099112391471862, + "num_tokens": 241683316.0, + "step": 97840 + }, + { + "epoch": 0.8971302833043, + "learning_rate": 2.0575777023929586e-05, + "loss": 0.9543, + "mean_token_accuracy": 0.7093935608863831, + "num_tokens": 241712258.0, + "step": 97850 + }, + { + "epoch": 0.8972219675437793, + "learning_rate": 2.055744017603374e-05, + "loss": 0.9511, + "mean_token_accuracy": 0.7118758618831634, + "num_tokens": 241741411.0, + "step": 97860 + }, + { + "epoch": 0.8973136517832585, + "learning_rate": 2.0539103328137893e-05, + "loss": 0.9746, + "mean_token_accuracy": 0.7053055465221405, + "num_tokens": 241768167.0, + "step": 97870 + }, + { + "epoch": 0.8974053360227376, + "learning_rate": 2.052076648024205e-05, + "loss": 0.9862, + "mean_token_accuracy": 0.7043285131454468, + "num_tokens": 241795756.0, + "step": 97880 + }, + { + "epoch": 0.8974970202622169, + "learning_rate": 2.05024296323462e-05, + "loss": 0.9676, + "mean_token_accuracy": 0.7091193974018097, + "num_tokens": 241824214.0, + "step": 97890 + }, + { + "epoch": 0.8975887045016961, + "learning_rate": 2.0484092784450352e-05, + "loss": 0.9547, + "mean_token_accuracy": 0.7121727526187897, + "num_tokens": 241851507.0, + "step": 97900 + }, + { + "epoch": 0.8976803887411754, + "learning_rate": 2.0465755936554508e-05, + "loss": 0.9444, + "mean_token_accuracy": 0.7150976479053497, + "num_tokens": 241878894.0, + "step": 97910 + }, + { + "epoch": 0.8977720729806546, + "learning_rate": 2.044741908865866e-05, + "loss": 0.939, + "mean_token_accuracy": 0.7140742897987366, + "num_tokens": 241908163.0, + "step": 97920 + }, + { + "epoch": 0.8978637572201339, + "learning_rate": 2.0429082240762815e-05, + "loss": 0.9576, + "mean_token_accuracy": 0.7055696487426758, + "num_tokens": 241937421.0, + "step": 97930 + }, + { + "epoch": 0.8979554414596131, + "learning_rate": 2.0410745392866967e-05, + "loss": 0.9352, + "mean_token_accuracy": 0.7135234117507935, + "num_tokens": 241965751.0, + "step": 97940 + }, + { + "epoch": 0.8980471256990923, + "learning_rate": 2.039240854497112e-05, + "loss": 0.9555, + "mean_token_accuracy": 0.7085389316082, + "num_tokens": 241994856.0, + "step": 97950 + }, + { + "epoch": 0.8981388099385715, + "learning_rate": 2.0374071697075274e-05, + "loss": 0.9718, + "mean_token_accuracy": 0.7018843948841095, + "num_tokens": 242022793.0, + "step": 97960 + }, + { + "epoch": 0.8982304941780508, + "learning_rate": 2.035573484917943e-05, + "loss": 0.9844, + "mean_token_accuracy": 0.700729638338089, + "num_tokens": 242050774.0, + "step": 97970 + }, + { + "epoch": 0.89832217841753, + "learning_rate": 2.033739800128358e-05, + "loss": 0.9406, + "mean_token_accuracy": 0.7121575176715851, + "num_tokens": 242078689.0, + "step": 97980 + }, + { + "epoch": 0.8984138626570093, + "learning_rate": 2.0319061153387733e-05, + "loss": 0.9529, + "mean_token_accuracy": 0.716164642572403, + "num_tokens": 242106528.0, + "step": 97990 + }, + { + "epoch": 0.8985055468964885, + "learning_rate": 2.0300724305491885e-05, + "loss": 0.9923, + "mean_token_accuracy": 0.6991463661193847, + "num_tokens": 242134110.0, + "step": 98000 + }, + { + "epoch": 0.8985972311359677, + "learning_rate": 2.028238745759604e-05, + "loss": 0.9581, + "mean_token_accuracy": 0.7144601285457611, + "num_tokens": 242161617.0, + "step": 98010 + }, + { + "epoch": 0.8986889153754469, + "learning_rate": 2.0264050609700195e-05, + "loss": 0.9762, + "mean_token_accuracy": 0.7069809973239899, + "num_tokens": 242190524.0, + "step": 98020 + }, + { + "epoch": 0.8987805996149262, + "learning_rate": 2.0245713761804347e-05, + "loss": 0.9535, + "mean_token_accuracy": 0.7110555589199066, + "num_tokens": 242218902.0, + "step": 98030 + }, + { + "epoch": 0.8988722838544054, + "learning_rate": 2.02273769139085e-05, + "loss": 0.9715, + "mean_token_accuracy": 0.7055911839008331, + "num_tokens": 242246071.0, + "step": 98040 + }, + { + "epoch": 0.8989639680938847, + "learning_rate": 2.020904006601265e-05, + "loss": 0.9596, + "mean_token_accuracy": 0.7030866265296936, + "num_tokens": 242274414.0, + "step": 98050 + }, + { + "epoch": 0.8990556523333639, + "learning_rate": 2.019070321811681e-05, + "loss": 0.9666, + "mean_token_accuracy": 0.7040348529815674, + "num_tokens": 242302623.0, + "step": 98060 + }, + { + "epoch": 0.8991473365728432, + "learning_rate": 2.017236637022096e-05, + "loss": 0.9532, + "mean_token_accuracy": 0.7138877093791962, + "num_tokens": 242331298.0, + "step": 98070 + }, + { + "epoch": 0.8992390208123223, + "learning_rate": 2.0154029522325113e-05, + "loss": 1.0112, + "mean_token_accuracy": 0.6944770693778992, + "num_tokens": 242359653.0, + "step": 98080 + }, + { + "epoch": 0.8993307050518016, + "learning_rate": 2.0135692674429265e-05, + "loss": 0.9643, + "mean_token_accuracy": 0.7098870873451233, + "num_tokens": 242388824.0, + "step": 98090 + }, + { + "epoch": 0.8994223892912808, + "learning_rate": 2.011735582653342e-05, + "loss": 0.9725, + "mean_token_accuracy": 0.7049516499042511, + "num_tokens": 242416601.0, + "step": 98100 + }, + { + "epoch": 0.8995140735307601, + "learning_rate": 2.0099018978637575e-05, + "loss": 0.9294, + "mean_token_accuracy": 0.7129597067832947, + "num_tokens": 242445464.0, + "step": 98110 + }, + { + "epoch": 0.8996057577702393, + "learning_rate": 2.0080682130741727e-05, + "loss": 0.9686, + "mean_token_accuracy": 0.7078495383262634, + "num_tokens": 242473337.0, + "step": 98120 + }, + { + "epoch": 0.8996974420097186, + "learning_rate": 2.006234528284588e-05, + "loss": 0.9496, + "mean_token_accuracy": 0.7084646999835968, + "num_tokens": 242502275.0, + "step": 98130 + }, + { + "epoch": 0.8997891262491977, + "learning_rate": 2.004400843495003e-05, + "loss": 1.0012, + "mean_token_accuracy": 0.703138554096222, + "num_tokens": 242530146.0, + "step": 98140 + }, + { + "epoch": 0.899880810488677, + "learning_rate": 2.0025671587054186e-05, + "loss": 0.982, + "mean_token_accuracy": 0.7043869853019714, + "num_tokens": 242557847.0, + "step": 98150 + }, + { + "epoch": 0.8999724947281562, + "learning_rate": 2.000733473915834e-05, + "loss": 0.972, + "mean_token_accuracy": 0.7044876873493194, + "num_tokens": 242586696.0, + "step": 98160 + }, + { + "epoch": 0.9000641789676355, + "learning_rate": 1.9988997891262493e-05, + "loss": 1.0118, + "mean_token_accuracy": 0.7073430299758912, + "num_tokens": 242614961.0, + "step": 98170 + }, + { + "epoch": 0.9001558632071147, + "learning_rate": 1.9970661043366645e-05, + "loss": 0.9528, + "mean_token_accuracy": 0.7149098515510559, + "num_tokens": 242643463.0, + "step": 98180 + }, + { + "epoch": 0.900247547446594, + "learning_rate": 1.99523241954708e-05, + "loss": 0.9449, + "mean_token_accuracy": 0.7118351042270661, + "num_tokens": 242672199.0, + "step": 98190 + }, + { + "epoch": 0.9003392316860732, + "learning_rate": 1.9933987347574952e-05, + "loss": 0.9504, + "mean_token_accuracy": 0.7106627702713013, + "num_tokens": 242700144.0, + "step": 98200 + }, + { + "epoch": 0.9004309159255524, + "learning_rate": 1.9915650499679108e-05, + "loss": 0.9515, + "mean_token_accuracy": 0.7086313486099243, + "num_tokens": 242728642.0, + "step": 98210 + }, + { + "epoch": 0.9005226001650316, + "learning_rate": 1.989731365178326e-05, + "loss": 0.9935, + "mean_token_accuracy": 0.7040349960327148, + "num_tokens": 242757097.0, + "step": 98220 + }, + { + "epoch": 0.9006142844045109, + "learning_rate": 1.987897680388741e-05, + "loss": 0.9826, + "mean_token_accuracy": 0.7031432092189789, + "num_tokens": 242785799.0, + "step": 98230 + }, + { + "epoch": 0.9007059686439901, + "learning_rate": 1.9860639955991567e-05, + "loss": 0.9377, + "mean_token_accuracy": 0.7090740144252777, + "num_tokens": 242813630.0, + "step": 98240 + }, + { + "epoch": 0.9007976528834694, + "learning_rate": 1.984230310809572e-05, + "loss": 0.9676, + "mean_token_accuracy": 0.7060315907001495, + "num_tokens": 242840394.0, + "step": 98250 + }, + { + "epoch": 0.9008893371229486, + "learning_rate": 1.9823966260199874e-05, + "loss": 0.973, + "mean_token_accuracy": 0.710243034362793, + "num_tokens": 242868857.0, + "step": 98260 + }, + { + "epoch": 0.9009810213624277, + "learning_rate": 1.9805629412304026e-05, + "loss": 0.9689, + "mean_token_accuracy": 0.7057923972606659, + "num_tokens": 242897116.0, + "step": 98270 + }, + { + "epoch": 0.901072705601907, + "learning_rate": 1.978729256440818e-05, + "loss": 0.9887, + "mean_token_accuracy": 0.7076674342155457, + "num_tokens": 242923929.0, + "step": 98280 + }, + { + "epoch": 0.9011643898413862, + "learning_rate": 1.9768955716512333e-05, + "loss": 0.929, + "mean_token_accuracy": 0.7210639715194702, + "num_tokens": 242951170.0, + "step": 98290 + }, + { + "epoch": 0.9012560740808655, + "learning_rate": 1.9750618868616485e-05, + "loss": 0.9481, + "mean_token_accuracy": 0.7090279400348664, + "num_tokens": 242978839.0, + "step": 98300 + }, + { + "epoch": 0.9013477583203447, + "learning_rate": 1.973228202072064e-05, + "loss": 0.947, + "mean_token_accuracy": 0.7095263004302979, + "num_tokens": 243006189.0, + "step": 98310 + }, + { + "epoch": 0.901439442559824, + "learning_rate": 1.9713945172824795e-05, + "loss": 0.9627, + "mean_token_accuracy": 0.7099762558937073, + "num_tokens": 243034368.0, + "step": 98320 + }, + { + "epoch": 0.9015311267993033, + "learning_rate": 1.9695608324928947e-05, + "loss": 0.9838, + "mean_token_accuracy": 0.7022603631019593, + "num_tokens": 243062477.0, + "step": 98330 + }, + { + "epoch": 0.9016228110387824, + "learning_rate": 1.96772714770331e-05, + "loss": 0.9514, + "mean_token_accuracy": 0.7108042061328887, + "num_tokens": 243090238.0, + "step": 98340 + }, + { + "epoch": 0.9017144952782616, + "learning_rate": 1.965893462913725e-05, + "loss": 0.9602, + "mean_token_accuracy": 0.708228987455368, + "num_tokens": 243118273.0, + "step": 98350 + }, + { + "epoch": 0.9018061795177409, + "learning_rate": 1.9640597781241406e-05, + "loss": 0.9663, + "mean_token_accuracy": 0.7075661361217499, + "num_tokens": 243146550.0, + "step": 98360 + }, + { + "epoch": 0.9018978637572201, + "learning_rate": 1.962226093334556e-05, + "loss": 0.9335, + "mean_token_accuracy": 0.7181289672851563, + "num_tokens": 243174904.0, + "step": 98370 + }, + { + "epoch": 0.9019895479966994, + "learning_rate": 1.9603924085449713e-05, + "loss": 0.9808, + "mean_token_accuracy": 0.7027455568313599, + "num_tokens": 243203644.0, + "step": 98380 + }, + { + "epoch": 0.9020812322361786, + "learning_rate": 1.9585587237553865e-05, + "loss": 0.9631, + "mean_token_accuracy": 0.7073743343353271, + "num_tokens": 243230956.0, + "step": 98390 + }, + { + "epoch": 0.9021729164756578, + "learning_rate": 1.9567250389658017e-05, + "loss": 0.9781, + "mean_token_accuracy": 0.7030749142169952, + "num_tokens": 243258979.0, + "step": 98400 + }, + { + "epoch": 0.902264600715137, + "learning_rate": 1.9548913541762172e-05, + "loss": 0.9357, + "mean_token_accuracy": 0.713792484998703, + "num_tokens": 243287241.0, + "step": 98410 + }, + { + "epoch": 0.9023562849546163, + "learning_rate": 1.9530576693866327e-05, + "loss": 0.944, + "mean_token_accuracy": 0.7122910678386688, + "num_tokens": 243315310.0, + "step": 98420 + }, + { + "epoch": 0.9024479691940955, + "learning_rate": 1.951223984597048e-05, + "loss": 0.9686, + "mean_token_accuracy": 0.7054218947887421, + "num_tokens": 243343271.0, + "step": 98430 + }, + { + "epoch": 0.9025396534335748, + "learning_rate": 1.949390299807463e-05, + "loss": 0.9403, + "mean_token_accuracy": 0.7059735238552094, + "num_tokens": 243371525.0, + "step": 98440 + }, + { + "epoch": 0.902631337673054, + "learning_rate": 1.9475566150178783e-05, + "loss": 0.9718, + "mean_token_accuracy": 0.70748171210289, + "num_tokens": 243399455.0, + "step": 98450 + }, + { + "epoch": 0.9027230219125333, + "learning_rate": 1.9457229302282938e-05, + "loss": 0.9467, + "mean_token_accuracy": 0.7119232892990113, + "num_tokens": 243426714.0, + "step": 98460 + }, + { + "epoch": 0.9028147061520124, + "learning_rate": 1.9438892454387094e-05, + "loss": 0.9364, + "mean_token_accuracy": 0.7129967391490937, + "num_tokens": 243455255.0, + "step": 98470 + }, + { + "epoch": 0.9029063903914917, + "learning_rate": 1.9420555606491245e-05, + "loss": 0.9252, + "mean_token_accuracy": 0.718877625465393, + "num_tokens": 243483096.0, + "step": 98480 + }, + { + "epoch": 0.9029980746309709, + "learning_rate": 1.9402218758595397e-05, + "loss": 0.9585, + "mean_token_accuracy": 0.7124249160289764, + "num_tokens": 243511074.0, + "step": 98490 + }, + { + "epoch": 0.9030897588704502, + "learning_rate": 1.9383881910699552e-05, + "loss": 0.9555, + "mean_token_accuracy": 0.7075623571872711, + "num_tokens": 243539196.0, + "step": 98500 + }, + { + "epoch": 0.9031814431099294, + "learning_rate": 1.9365545062803704e-05, + "loss": 0.9611, + "mean_token_accuracy": 0.7051093578338623, + "num_tokens": 243566995.0, + "step": 98510 + }, + { + "epoch": 0.9032731273494087, + "learning_rate": 1.934720821490786e-05, + "loss": 0.977, + "mean_token_accuracy": 0.706699115037918, + "num_tokens": 243594851.0, + "step": 98520 + }, + { + "epoch": 0.9033648115888878, + "learning_rate": 1.932887136701201e-05, + "loss": 0.9476, + "mean_token_accuracy": 0.7158394098281861, + "num_tokens": 243623453.0, + "step": 98530 + }, + { + "epoch": 0.9034564958283671, + "learning_rate": 1.9310534519116163e-05, + "loss": 0.9466, + "mean_token_accuracy": 0.7080992043018342, + "num_tokens": 243650900.0, + "step": 98540 + }, + { + "epoch": 0.9035481800678463, + "learning_rate": 1.929219767122032e-05, + "loss": 0.967, + "mean_token_accuracy": 0.7112585842609406, + "num_tokens": 243678387.0, + "step": 98550 + }, + { + "epoch": 0.9036398643073256, + "learning_rate": 1.927386082332447e-05, + "loss": 0.9418, + "mean_token_accuracy": 0.7078060448169708, + "num_tokens": 243706298.0, + "step": 98560 + }, + { + "epoch": 0.9037315485468048, + "learning_rate": 1.9255523975428626e-05, + "loss": 0.968, + "mean_token_accuracy": 0.7058828592300415, + "num_tokens": 243734181.0, + "step": 98570 + }, + { + "epoch": 0.9038232327862841, + "learning_rate": 1.9237187127532778e-05, + "loss": 0.9831, + "mean_token_accuracy": 0.7044422030448914, + "num_tokens": 243761708.0, + "step": 98580 + }, + { + "epoch": 0.9039149170257633, + "learning_rate": 1.9218850279636933e-05, + "loss": 0.948, + "mean_token_accuracy": 0.7123528182506561, + "num_tokens": 243789810.0, + "step": 98590 + }, + { + "epoch": 0.9040066012652425, + "learning_rate": 1.9200513431741085e-05, + "loss": 0.9378, + "mean_token_accuracy": 0.7146504878997803, + "num_tokens": 243817994.0, + "step": 98600 + }, + { + "epoch": 0.9040982855047217, + "learning_rate": 1.9182176583845237e-05, + "loss": 0.9505, + "mean_token_accuracy": 0.7088361203670501, + "num_tokens": 243845439.0, + "step": 98610 + }, + { + "epoch": 0.904189969744201, + "learning_rate": 1.9163839735949392e-05, + "loss": 0.9522, + "mean_token_accuracy": 0.7110304951667785, + "num_tokens": 243873228.0, + "step": 98620 + }, + { + "epoch": 0.9042816539836802, + "learning_rate": 1.9145502888053547e-05, + "loss": 0.9687, + "mean_token_accuracy": 0.7034121513366699, + "num_tokens": 243900947.0, + "step": 98630 + }, + { + "epoch": 0.9043733382231595, + "learning_rate": 1.91271660401577e-05, + "loss": 0.9489, + "mean_token_accuracy": 0.7118391335010529, + "num_tokens": 243929521.0, + "step": 98640 + }, + { + "epoch": 0.9044650224626387, + "learning_rate": 1.910882919226185e-05, + "loss": 0.9541, + "mean_token_accuracy": 0.7096317946910858, + "num_tokens": 243957669.0, + "step": 98650 + }, + { + "epoch": 0.9045567067021179, + "learning_rate": 1.9090492344366003e-05, + "loss": 0.9445, + "mean_token_accuracy": 0.7117459297180175, + "num_tokens": 243985484.0, + "step": 98660 + }, + { + "epoch": 0.9046483909415971, + "learning_rate": 1.9072155496470158e-05, + "loss": 0.9604, + "mean_token_accuracy": 0.7134973287582398, + "num_tokens": 244012831.0, + "step": 98670 + }, + { + "epoch": 0.9047400751810764, + "learning_rate": 1.9053818648574313e-05, + "loss": 0.9697, + "mean_token_accuracy": 0.7078468203544617, + "num_tokens": 244041318.0, + "step": 98680 + }, + { + "epoch": 0.9048317594205556, + "learning_rate": 1.9035481800678465e-05, + "loss": 0.9749, + "mean_token_accuracy": 0.6981931924819946, + "num_tokens": 244069948.0, + "step": 98690 + }, + { + "epoch": 0.9049234436600349, + "learning_rate": 1.9017144952782617e-05, + "loss": 0.9545, + "mean_token_accuracy": 0.7123080134391785, + "num_tokens": 244097819.0, + "step": 98700 + }, + { + "epoch": 0.9050151278995141, + "learning_rate": 1.899880810488677e-05, + "loss": 0.9694, + "mean_token_accuracy": 0.7063113808631897, + "num_tokens": 244125848.0, + "step": 98710 + }, + { + "epoch": 0.9051068121389934, + "learning_rate": 1.8980471256990924e-05, + "loss": 0.9544, + "mean_token_accuracy": 0.7099994361400604, + "num_tokens": 244154158.0, + "step": 98720 + }, + { + "epoch": 0.9051984963784725, + "learning_rate": 1.896213440909508e-05, + "loss": 0.9469, + "mean_token_accuracy": 0.7134117543697357, + "num_tokens": 244181368.0, + "step": 98730 + }, + { + "epoch": 0.9052901806179517, + "learning_rate": 1.894379756119923e-05, + "loss": 0.9588, + "mean_token_accuracy": 0.7087450921535492, + "num_tokens": 244209801.0, + "step": 98740 + }, + { + "epoch": 0.905381864857431, + "learning_rate": 1.8925460713303383e-05, + "loss": 0.9643, + "mean_token_accuracy": 0.7068106710910798, + "num_tokens": 244237529.0, + "step": 98750 + }, + { + "epoch": 0.9054735490969102, + "learning_rate": 1.8907123865407535e-05, + "loss": 0.9769, + "mean_token_accuracy": 0.7031436681747436, + "num_tokens": 244264568.0, + "step": 98760 + }, + { + "epoch": 0.9055652333363895, + "learning_rate": 1.888878701751169e-05, + "loss": 0.9577, + "mean_token_accuracy": 0.7108761012554169, + "num_tokens": 244292725.0, + "step": 98770 + }, + { + "epoch": 0.9056569175758687, + "learning_rate": 1.8870450169615845e-05, + "loss": 0.9686, + "mean_token_accuracy": 0.706019914150238, + "num_tokens": 244321019.0, + "step": 98780 + }, + { + "epoch": 0.9057486018153479, + "learning_rate": 1.8852113321719997e-05, + "loss": 0.9717, + "mean_token_accuracy": 0.7070391476154327, + "num_tokens": 244348792.0, + "step": 98790 + }, + { + "epoch": 0.9058402860548271, + "learning_rate": 1.883377647382415e-05, + "loss": 0.9616, + "mean_token_accuracy": 0.7171567678451538, + "num_tokens": 244376666.0, + "step": 98800 + }, + { + "epoch": 0.9059319702943064, + "learning_rate": 1.8815439625928304e-05, + "loss": 0.9533, + "mean_token_accuracy": 0.7125464618206024, + "num_tokens": 244404454.0, + "step": 98810 + }, + { + "epoch": 0.9060236545337856, + "learning_rate": 1.8797102778032456e-05, + "loss": 0.9868, + "mean_token_accuracy": 0.7024095237255097, + "num_tokens": 244432600.0, + "step": 98820 + }, + { + "epoch": 0.9061153387732649, + "learning_rate": 1.877876593013661e-05, + "loss": 0.9966, + "mean_token_accuracy": 0.703163868188858, + "num_tokens": 244460141.0, + "step": 98830 + }, + { + "epoch": 0.9062070230127441, + "learning_rate": 1.8760429082240763e-05, + "loss": 0.9545, + "mean_token_accuracy": 0.7115595698356628, + "num_tokens": 244488764.0, + "step": 98840 + }, + { + "epoch": 0.9062987072522234, + "learning_rate": 1.8742092234344915e-05, + "loss": 0.9634, + "mean_token_accuracy": 0.7091646432876587, + "num_tokens": 244516920.0, + "step": 98850 + }, + { + "epoch": 0.9063903914917025, + "learning_rate": 1.872375538644907e-05, + "loss": 0.9697, + "mean_token_accuracy": 0.7015791535377502, + "num_tokens": 244544901.0, + "step": 98860 + }, + { + "epoch": 0.9064820757311818, + "learning_rate": 1.8705418538553222e-05, + "loss": 0.9769, + "mean_token_accuracy": 0.7043940842151641, + "num_tokens": 244573250.0, + "step": 98870 + }, + { + "epoch": 0.906573759970661, + "learning_rate": 1.8687081690657378e-05, + "loss": 0.9802, + "mean_token_accuracy": 0.7076828479766846, + "num_tokens": 244600931.0, + "step": 98880 + }, + { + "epoch": 0.9066654442101403, + "learning_rate": 1.866874484276153e-05, + "loss": 0.9581, + "mean_token_accuracy": 0.7101810514926911, + "num_tokens": 244629485.0, + "step": 98890 + }, + { + "epoch": 0.9067571284496195, + "learning_rate": 1.8650407994865685e-05, + "loss": 0.9765, + "mean_token_accuracy": 0.705142331123352, + "num_tokens": 244657446.0, + "step": 98900 + }, + { + "epoch": 0.9068488126890988, + "learning_rate": 1.8632071146969837e-05, + "loss": 0.954, + "mean_token_accuracy": 0.711612057685852, + "num_tokens": 244685629.0, + "step": 98910 + }, + { + "epoch": 0.906940496928578, + "learning_rate": 1.861373429907399e-05, + "loss": 0.9303, + "mean_token_accuracy": 0.7186287760734558, + "num_tokens": 244713457.0, + "step": 98920 + }, + { + "epoch": 0.9070321811680572, + "learning_rate": 1.8595397451178144e-05, + "loss": 0.9377, + "mean_token_accuracy": 0.7127879858016968, + "num_tokens": 244740850.0, + "step": 98930 + }, + { + "epoch": 0.9071238654075364, + "learning_rate": 1.85770606032823e-05, + "loss": 0.9446, + "mean_token_accuracy": 0.713395619392395, + "num_tokens": 244767394.0, + "step": 98940 + }, + { + "epoch": 0.9072155496470157, + "learning_rate": 1.855872375538645e-05, + "loss": 0.9687, + "mean_token_accuracy": 0.7102888941764831, + "num_tokens": 244795492.0, + "step": 98950 + }, + { + "epoch": 0.9073072338864949, + "learning_rate": 1.8540386907490603e-05, + "loss": 0.9541, + "mean_token_accuracy": 0.7060974717140198, + "num_tokens": 244823023.0, + "step": 98960 + }, + { + "epoch": 0.9073989181259742, + "learning_rate": 1.8522050059594755e-05, + "loss": 0.9743, + "mean_token_accuracy": 0.7049482047557831, + "num_tokens": 244851393.0, + "step": 98970 + }, + { + "epoch": 0.9074906023654534, + "learning_rate": 1.850371321169891e-05, + "loss": 0.9382, + "mean_token_accuracy": 0.7122291028499603, + "num_tokens": 244879127.0, + "step": 98980 + }, + { + "epoch": 0.9075822866049326, + "learning_rate": 1.8485376363803065e-05, + "loss": 0.9678, + "mean_token_accuracy": 0.7073399364948273, + "num_tokens": 244907138.0, + "step": 98990 + }, + { + "epoch": 0.9076739708444118, + "learning_rate": 1.8467039515907217e-05, + "loss": 0.9475, + "mean_token_accuracy": 0.7094966411590576, + "num_tokens": 244934511.0, + "step": 99000 + }, + { + "epoch": 0.9077656550838911, + "learning_rate": 1.844870266801137e-05, + "loss": 0.946, + "mean_token_accuracy": 0.7111939191818237, + "num_tokens": 244962022.0, + "step": 99010 + }, + { + "epoch": 0.9078573393233703, + "learning_rate": 1.843036582011552e-05, + "loss": 1.0062, + "mean_token_accuracy": 0.6980007529258728, + "num_tokens": 244989987.0, + "step": 99020 + }, + { + "epoch": 0.9079490235628496, + "learning_rate": 1.8412028972219676e-05, + "loss": 0.9577, + "mean_token_accuracy": 0.7091847062110901, + "num_tokens": 245018560.0, + "step": 99030 + }, + { + "epoch": 0.9080407078023288, + "learning_rate": 1.839369212432383e-05, + "loss": 0.9409, + "mean_token_accuracy": 0.7124989271163941, + "num_tokens": 245046548.0, + "step": 99040 + }, + { + "epoch": 0.9081323920418081, + "learning_rate": 1.8375355276427983e-05, + "loss": 0.9533, + "mean_token_accuracy": 0.710144329071045, + "num_tokens": 245074974.0, + "step": 99050 + }, + { + "epoch": 0.9082240762812872, + "learning_rate": 1.8357018428532135e-05, + "loss": 0.9767, + "mean_token_accuracy": 0.7003639161586761, + "num_tokens": 245102673.0, + "step": 99060 + }, + { + "epoch": 0.9083157605207665, + "learning_rate": 1.8338681580636287e-05, + "loss": 0.9644, + "mean_token_accuracy": 0.7086762249469757, + "num_tokens": 245131267.0, + "step": 99070 + }, + { + "epoch": 0.9084074447602457, + "learning_rate": 1.8320344732740442e-05, + "loss": 0.984, + "mean_token_accuracy": 0.7076332032680511, + "num_tokens": 245160271.0, + "step": 99080 + }, + { + "epoch": 0.908499128999725, + "learning_rate": 1.8302007884844597e-05, + "loss": 0.9315, + "mean_token_accuracy": 0.7142459034919739, + "num_tokens": 245188732.0, + "step": 99090 + }, + { + "epoch": 0.9085908132392042, + "learning_rate": 1.828367103694875e-05, + "loss": 0.9599, + "mean_token_accuracy": 0.7091251969337463, + "num_tokens": 245216631.0, + "step": 99100 + }, + { + "epoch": 0.9086824974786835, + "learning_rate": 1.82653341890529e-05, + "loss": 0.9498, + "mean_token_accuracy": 0.7134461283683777, + "num_tokens": 245244130.0, + "step": 99110 + }, + { + "epoch": 0.9087741817181626, + "learning_rate": 1.8246997341157056e-05, + "loss": 0.9777, + "mean_token_accuracy": 0.702265340089798, + "num_tokens": 245271220.0, + "step": 99120 + }, + { + "epoch": 0.9088658659576418, + "learning_rate": 1.8228660493261208e-05, + "loss": 0.9438, + "mean_token_accuracy": 0.7100129187107086, + "num_tokens": 245299301.0, + "step": 99130 + }, + { + "epoch": 0.9089575501971211, + "learning_rate": 1.8210323645365363e-05, + "loss": 0.9909, + "mean_token_accuracy": 0.699597829580307, + "num_tokens": 245327480.0, + "step": 99140 + }, + { + "epoch": 0.9090492344366004, + "learning_rate": 1.8191986797469515e-05, + "loss": 0.9541, + "mean_token_accuracy": 0.7078088283538818, + "num_tokens": 245356376.0, + "step": 99150 + }, + { + "epoch": 0.9091409186760796, + "learning_rate": 1.8173649949573667e-05, + "loss": 0.9648, + "mean_token_accuracy": 0.7084352314472199, + "num_tokens": 245383818.0, + "step": 99160 + }, + { + "epoch": 0.9092326029155589, + "learning_rate": 1.8155313101677822e-05, + "loss": 0.9596, + "mean_token_accuracy": 0.7130893707275391, + "num_tokens": 245411880.0, + "step": 99170 + }, + { + "epoch": 0.9093242871550381, + "learning_rate": 1.8136976253781974e-05, + "loss": 0.9689, + "mean_token_accuracy": 0.7035489439964294, + "num_tokens": 245438299.0, + "step": 99180 + }, + { + "epoch": 0.9094159713945172, + "learning_rate": 1.811863940588613e-05, + "loss": 0.9411, + "mean_token_accuracy": 0.7125300884246826, + "num_tokens": 245465862.0, + "step": 99190 + }, + { + "epoch": 0.9095076556339965, + "learning_rate": 1.810030255799028e-05, + "loss": 0.9604, + "mean_token_accuracy": 0.7077223598957062, + "num_tokens": 245495043.0, + "step": 99200 + }, + { + "epoch": 0.9095993398734757, + "learning_rate": 1.8081965710094437e-05, + "loss": 0.9366, + "mean_token_accuracy": 0.7149075448513031, + "num_tokens": 245522478.0, + "step": 99210 + }, + { + "epoch": 0.909691024112955, + "learning_rate": 1.806362886219859e-05, + "loss": 0.9709, + "mean_token_accuracy": 0.7035350382328034, + "num_tokens": 245549466.0, + "step": 99220 + }, + { + "epoch": 0.9097827083524342, + "learning_rate": 1.804529201430274e-05, + "loss": 0.9765, + "mean_token_accuracy": 0.6995810747146607, + "num_tokens": 245578705.0, + "step": 99230 + }, + { + "epoch": 0.9098743925919135, + "learning_rate": 1.8026955166406896e-05, + "loss": 0.9627, + "mean_token_accuracy": 0.7103352427482605, + "num_tokens": 245605976.0, + "step": 99240 + }, + { + "epoch": 0.9099660768313926, + "learning_rate": 1.800861831851105e-05, + "loss": 0.9563, + "mean_token_accuracy": 0.7094795227050781, + "num_tokens": 245633499.0, + "step": 99250 + }, + { + "epoch": 0.9100577610708719, + "learning_rate": 1.7990281470615203e-05, + "loss": 0.9544, + "mean_token_accuracy": 0.7120623230934143, + "num_tokens": 245662205.0, + "step": 99260 + }, + { + "epoch": 0.9101494453103511, + "learning_rate": 1.7971944622719355e-05, + "loss": 0.9688, + "mean_token_accuracy": 0.7137180268764496, + "num_tokens": 245689488.0, + "step": 99270 + }, + { + "epoch": 0.9102411295498304, + "learning_rate": 1.7953607774823507e-05, + "loss": 0.964, + "mean_token_accuracy": 0.708096569776535, + "num_tokens": 245716912.0, + "step": 99280 + }, + { + "epoch": 0.9103328137893096, + "learning_rate": 1.7935270926927662e-05, + "loss": 0.9566, + "mean_token_accuracy": 0.7079792618751526, + "num_tokens": 245745035.0, + "step": 99290 + }, + { + "epoch": 0.9104244980287889, + "learning_rate": 1.7916934079031817e-05, + "loss": 0.9825, + "mean_token_accuracy": 0.7026017665863037, + "num_tokens": 245773141.0, + "step": 99300 + }, + { + "epoch": 0.9105161822682681, + "learning_rate": 1.789859723113597e-05, + "loss": 0.9718, + "mean_token_accuracy": 0.7071141004562378, + "num_tokens": 245801463.0, + "step": 99310 + }, + { + "epoch": 0.9106078665077473, + "learning_rate": 1.788026038324012e-05, + "loss": 0.9458, + "mean_token_accuracy": 0.7118683815002441, + "num_tokens": 245830678.0, + "step": 99320 + }, + { + "epoch": 0.9106995507472265, + "learning_rate": 1.7861923535344273e-05, + "loss": 0.9877, + "mean_token_accuracy": 0.7052164196968078, + "num_tokens": 245858415.0, + "step": 99330 + }, + { + "epoch": 0.9107912349867058, + "learning_rate": 1.784358668744843e-05, + "loss": 0.9943, + "mean_token_accuracy": 0.695398610830307, + "num_tokens": 245886988.0, + "step": 99340 + }, + { + "epoch": 0.910882919226185, + "learning_rate": 1.7825249839552583e-05, + "loss": 0.9179, + "mean_token_accuracy": 0.7180028676986694, + "num_tokens": 245914904.0, + "step": 99350 + }, + { + "epoch": 0.9109746034656643, + "learning_rate": 1.7806912991656735e-05, + "loss": 0.9511, + "mean_token_accuracy": 0.7151628613471985, + "num_tokens": 245942862.0, + "step": 99360 + }, + { + "epoch": 0.9110662877051435, + "learning_rate": 1.7788576143760887e-05, + "loss": 0.9493, + "mean_token_accuracy": 0.7169644296169281, + "num_tokens": 245969861.0, + "step": 99370 + }, + { + "epoch": 0.9111579719446227, + "learning_rate": 1.777023929586504e-05, + "loss": 0.9589, + "mean_token_accuracy": 0.7156728386878968, + "num_tokens": 245998071.0, + "step": 99380 + }, + { + "epoch": 0.9112496561841019, + "learning_rate": 1.7751902447969197e-05, + "loss": 0.9643, + "mean_token_accuracy": 0.7130199491977691, + "num_tokens": 246026673.0, + "step": 99390 + }, + { + "epoch": 0.9113413404235812, + "learning_rate": 1.773356560007335e-05, + "loss": 0.9391, + "mean_token_accuracy": 0.7124180436134339, + "num_tokens": 246055196.0, + "step": 99400 + }, + { + "epoch": 0.9114330246630604, + "learning_rate": 1.77152287521775e-05, + "loss": 0.9396, + "mean_token_accuracy": 0.7146018385887146, + "num_tokens": 246083376.0, + "step": 99410 + }, + { + "epoch": 0.9115247089025397, + "learning_rate": 1.7696891904281653e-05, + "loss": 0.9725, + "mean_token_accuracy": 0.7048784852027893, + "num_tokens": 246111594.0, + "step": 99420 + }, + { + "epoch": 0.9116163931420189, + "learning_rate": 1.767855505638581e-05, + "loss": 0.9431, + "mean_token_accuracy": 0.7131402134895325, + "num_tokens": 246139183.0, + "step": 99430 + }, + { + "epoch": 0.9117080773814982, + "learning_rate": 1.7660218208489964e-05, + "loss": 0.9725, + "mean_token_accuracy": 0.7039356589317322, + "num_tokens": 246167209.0, + "step": 99440 + }, + { + "epoch": 0.9117997616209773, + "learning_rate": 1.7641881360594115e-05, + "loss": 0.955, + "mean_token_accuracy": 0.7087647438049316, + "num_tokens": 246194224.0, + "step": 99450 + }, + { + "epoch": 0.9118914458604566, + "learning_rate": 1.7623544512698267e-05, + "loss": 0.9464, + "mean_token_accuracy": 0.7096237003803253, + "num_tokens": 246221570.0, + "step": 99460 + }, + { + "epoch": 0.9119831300999358, + "learning_rate": 1.760520766480242e-05, + "loss": 0.9595, + "mean_token_accuracy": 0.70811527967453, + "num_tokens": 246250606.0, + "step": 99470 + }, + { + "epoch": 0.9120748143394151, + "learning_rate": 1.7586870816906574e-05, + "loss": 0.9406, + "mean_token_accuracy": 0.7127262830734253, + "num_tokens": 246278513.0, + "step": 99480 + }, + { + "epoch": 0.9121664985788943, + "learning_rate": 1.756853396901073e-05, + "loss": 0.9319, + "mean_token_accuracy": 0.7115866303443908, + "num_tokens": 246307389.0, + "step": 99490 + }, + { + "epoch": 0.9122581828183736, + "learning_rate": 1.755019712111488e-05, + "loss": 0.9756, + "mean_token_accuracy": 0.705430406332016, + "num_tokens": 246334845.0, + "step": 99500 + }, + { + "epoch": 0.9123498670578527, + "learning_rate": 1.7531860273219033e-05, + "loss": 0.9308, + "mean_token_accuracy": 0.7134301126003265, + "num_tokens": 246362959.0, + "step": 99510 + }, + { + "epoch": 0.912441551297332, + "learning_rate": 1.751352342532319e-05, + "loss": 0.9867, + "mean_token_accuracy": 0.703470128774643, + "num_tokens": 246391278.0, + "step": 99520 + }, + { + "epoch": 0.9125332355368112, + "learning_rate": 1.749518657742734e-05, + "loss": 0.9511, + "mean_token_accuracy": 0.7146863520145417, + "num_tokens": 246418411.0, + "step": 99530 + }, + { + "epoch": 0.9126249197762905, + "learning_rate": 1.7476849729531496e-05, + "loss": 0.9828, + "mean_token_accuracy": 0.7031401574611664, + "num_tokens": 246446501.0, + "step": 99540 + }, + { + "epoch": 0.9127166040157697, + "learning_rate": 1.7458512881635648e-05, + "loss": 0.9813, + "mean_token_accuracy": 0.7034123122692109, + "num_tokens": 246474522.0, + "step": 99550 + }, + { + "epoch": 0.912808288255249, + "learning_rate": 1.74401760337398e-05, + "loss": 0.9408, + "mean_token_accuracy": 0.7101796746253968, + "num_tokens": 246503042.0, + "step": 99560 + }, + { + "epoch": 0.9128999724947282, + "learning_rate": 1.7421839185843955e-05, + "loss": 0.9274, + "mean_token_accuracy": 0.7152628660202026, + "num_tokens": 246531643.0, + "step": 99570 + }, + { + "epoch": 0.9129916567342073, + "learning_rate": 1.7403502337948107e-05, + "loss": 0.96, + "mean_token_accuracy": 0.7102968633174896, + "num_tokens": 246560115.0, + "step": 99580 + }, + { + "epoch": 0.9130833409736866, + "learning_rate": 1.7385165490052262e-05, + "loss": 0.9941, + "mean_token_accuracy": 0.6982282519340515, + "num_tokens": 246588271.0, + "step": 99590 + }, + { + "epoch": 0.9131750252131658, + "learning_rate": 1.7366828642156414e-05, + "loss": 0.9507, + "mean_token_accuracy": 0.7108680367469787, + "num_tokens": 246616955.0, + "step": 99600 + }, + { + "epoch": 0.9132667094526451, + "learning_rate": 1.734849179426057e-05, + "loss": 0.9148, + "mean_token_accuracy": 0.7212695956230164, + "num_tokens": 246645517.0, + "step": 99610 + }, + { + "epoch": 0.9133583936921243, + "learning_rate": 1.733015494636472e-05, + "loss": 0.9604, + "mean_token_accuracy": 0.7041295111179352, + "num_tokens": 246673947.0, + "step": 99620 + }, + { + "epoch": 0.9134500779316036, + "learning_rate": 1.7311818098468873e-05, + "loss": 0.9508, + "mean_token_accuracy": 0.7109302341938019, + "num_tokens": 246701153.0, + "step": 99630 + }, + { + "epoch": 0.9135417621710827, + "learning_rate": 1.7293481250573028e-05, + "loss": 0.9308, + "mean_token_accuracy": 0.7114158809185028, + "num_tokens": 246728338.0, + "step": 99640 + }, + { + "epoch": 0.913633446410562, + "learning_rate": 1.7275144402677183e-05, + "loss": 0.9586, + "mean_token_accuracy": 0.7120016038417816, + "num_tokens": 246756496.0, + "step": 99650 + }, + { + "epoch": 0.9137251306500412, + "learning_rate": 1.7256807554781335e-05, + "loss": 0.9286, + "mean_token_accuracy": 0.7170893132686615, + "num_tokens": 246783803.0, + "step": 99660 + }, + { + "epoch": 0.9138168148895205, + "learning_rate": 1.7238470706885487e-05, + "loss": 0.9398, + "mean_token_accuracy": 0.7143398344516754, + "num_tokens": 246810903.0, + "step": 99670 + }, + { + "epoch": 0.9139084991289997, + "learning_rate": 1.722013385898964e-05, + "loss": 0.9505, + "mean_token_accuracy": 0.7043926000595093, + "num_tokens": 246838738.0, + "step": 99680 + }, + { + "epoch": 0.914000183368479, + "learning_rate": 1.7201797011093794e-05, + "loss": 0.9494, + "mean_token_accuracy": 0.7065604150295257, + "num_tokens": 246868248.0, + "step": 99690 + }, + { + "epoch": 0.9140918676079582, + "learning_rate": 1.718346016319795e-05, + "loss": 0.9558, + "mean_token_accuracy": 0.7034044682979583, + "num_tokens": 246896457.0, + "step": 99700 + }, + { + "epoch": 0.9141835518474374, + "learning_rate": 1.71651233153021e-05, + "loss": 0.942, + "mean_token_accuracy": 0.714598786830902, + "num_tokens": 246923841.0, + "step": 99710 + }, + { + "epoch": 0.9142752360869166, + "learning_rate": 1.7146786467406253e-05, + "loss": 0.9386, + "mean_token_accuracy": 0.7097809672355652, + "num_tokens": 246951572.0, + "step": 99720 + }, + { + "epoch": 0.9143669203263959, + "learning_rate": 1.7128449619510405e-05, + "loss": 0.9442, + "mean_token_accuracy": 0.7133966445922851, + "num_tokens": 246980629.0, + "step": 99730 + }, + { + "epoch": 0.9144586045658751, + "learning_rate": 1.711011277161456e-05, + "loss": 0.9581, + "mean_token_accuracy": 0.7073602676391602, + "num_tokens": 247007679.0, + "step": 99740 + }, + { + "epoch": 0.9145502888053544, + "learning_rate": 1.7091775923718716e-05, + "loss": 0.961, + "mean_token_accuracy": 0.7088682174682617, + "num_tokens": 247035494.0, + "step": 99750 + }, + { + "epoch": 0.9146419730448336, + "learning_rate": 1.7073439075822867e-05, + "loss": 0.9605, + "mean_token_accuracy": 0.7071173548698425, + "num_tokens": 247062410.0, + "step": 99760 + }, + { + "epoch": 0.9147336572843128, + "learning_rate": 1.705510222792702e-05, + "loss": 0.9393, + "mean_token_accuracy": 0.7137604415416717, + "num_tokens": 247090463.0, + "step": 99770 + }, + { + "epoch": 0.914825341523792, + "learning_rate": 1.703676538003117e-05, + "loss": 0.9298, + "mean_token_accuracy": 0.718628978729248, + "num_tokens": 247118705.0, + "step": 99780 + }, + { + "epoch": 0.9149170257632713, + "learning_rate": 1.7018428532135326e-05, + "loss": 0.9632, + "mean_token_accuracy": 0.7087247788906097, + "num_tokens": 247146866.0, + "step": 99790 + }, + { + "epoch": 0.9150087100027505, + "learning_rate": 1.700009168423948e-05, + "loss": 0.9252, + "mean_token_accuracy": 0.7173439919948578, + "num_tokens": 247174348.0, + "step": 99800 + }, + { + "epoch": 0.9151003942422298, + "learning_rate": 1.6981754836343633e-05, + "loss": 0.945, + "mean_token_accuracy": 0.7133069396018982, + "num_tokens": 247201025.0, + "step": 99810 + }, + { + "epoch": 0.915192078481709, + "learning_rate": 1.6963417988447785e-05, + "loss": 0.9693, + "mean_token_accuracy": 0.7048952162265778, + "num_tokens": 247227932.0, + "step": 99820 + }, + { + "epoch": 0.9152837627211883, + "learning_rate": 1.694508114055194e-05, + "loss": 0.9652, + "mean_token_accuracy": 0.703224265575409, + "num_tokens": 247256143.0, + "step": 99830 + }, + { + "epoch": 0.9153754469606674, + "learning_rate": 1.6926744292656092e-05, + "loss": 0.9858, + "mean_token_accuracy": 0.7009982287883758, + "num_tokens": 247284651.0, + "step": 99840 + }, + { + "epoch": 0.9154671312001467, + "learning_rate": 1.6908407444760248e-05, + "loss": 0.9349, + "mean_token_accuracy": 0.719301962852478, + "num_tokens": 247312168.0, + "step": 99850 + }, + { + "epoch": 0.9155588154396259, + "learning_rate": 1.68900705968644e-05, + "loss": 0.9543, + "mean_token_accuracy": 0.7073159754276276, + "num_tokens": 247339562.0, + "step": 99860 + }, + { + "epoch": 0.9156504996791052, + "learning_rate": 1.687173374896855e-05, + "loss": 0.9736, + "mean_token_accuracy": 0.7037499010562897, + "num_tokens": 247367591.0, + "step": 99870 + }, + { + "epoch": 0.9157421839185844, + "learning_rate": 1.6853396901072707e-05, + "loss": 0.9568, + "mean_token_accuracy": 0.710649061203003, + "num_tokens": 247394895.0, + "step": 99880 + }, + { + "epoch": 0.9158338681580637, + "learning_rate": 1.683506005317686e-05, + "loss": 0.9364, + "mean_token_accuracy": 0.716763186454773, + "num_tokens": 247421838.0, + "step": 99890 + }, + { + "epoch": 0.9159255523975428, + "learning_rate": 1.6816723205281014e-05, + "loss": 0.9384, + "mean_token_accuracy": 0.7132778227329254, + "num_tokens": 247449576.0, + "step": 99900 + }, + { + "epoch": 0.9160172366370221, + "learning_rate": 1.6798386357385166e-05, + "loss": 0.9398, + "mean_token_accuracy": 0.7177938222885132, + "num_tokens": 247476638.0, + "step": 99910 + }, + { + "epoch": 0.9161089208765013, + "learning_rate": 1.678004950948932e-05, + "loss": 0.9669, + "mean_token_accuracy": 0.7109892904758454, + "num_tokens": 247504955.0, + "step": 99920 + }, + { + "epoch": 0.9162006051159806, + "learning_rate": 1.6761712661593473e-05, + "loss": 0.953, + "mean_token_accuracy": 0.7131851136684417, + "num_tokens": 247532364.0, + "step": 99930 + }, + { + "epoch": 0.9162922893554598, + "learning_rate": 1.6743375813697625e-05, + "loss": 0.9645, + "mean_token_accuracy": 0.7099905014038086, + "num_tokens": 247560532.0, + "step": 99940 + }, + { + "epoch": 0.9163839735949391, + "learning_rate": 1.672503896580178e-05, + "loss": 0.9669, + "mean_token_accuracy": 0.7084422290325165, + "num_tokens": 247588427.0, + "step": 99950 + }, + { + "epoch": 0.9164756578344183, + "learning_rate": 1.6706702117905935e-05, + "loss": 0.9606, + "mean_token_accuracy": 0.7048634946346283, + "num_tokens": 247616600.0, + "step": 99960 + }, + { + "epoch": 0.9165673420738975, + "learning_rate": 1.6688365270010087e-05, + "loss": 0.9683, + "mean_token_accuracy": 0.7047381281852723, + "num_tokens": 247644520.0, + "step": 99970 + }, + { + "epoch": 0.9166590263133767, + "learning_rate": 1.667002842211424e-05, + "loss": 0.9759, + "mean_token_accuracy": 0.7052361905574799, + "num_tokens": 247672647.0, + "step": 99980 + }, + { + "epoch": 0.916750710552856, + "learning_rate": 1.665169157421839e-05, + "loss": 0.9489, + "mean_token_accuracy": 0.7082134187221527, + "num_tokens": 247700084.0, + "step": 99990 + }, + { + "epoch": 0.9168423947923352, + "learning_rate": 1.6633354726322546e-05, + "loss": 0.9397, + "mean_token_accuracy": 0.7144883096218109, + "num_tokens": 247727674.0, + "step": 100000 + }, + { + "epoch": 0.9169340790318145, + "learning_rate": 1.66150178784267e-05, + "loss": 0.9367, + "mean_token_accuracy": 0.7193460941314698, + "num_tokens": 247755286.0, + "step": 100010 + }, + { + "epoch": 0.9170257632712937, + "learning_rate": 1.6596681030530853e-05, + "loss": 0.9658, + "mean_token_accuracy": 0.7092611610889434, + "num_tokens": 247783728.0, + "step": 100020 + }, + { + "epoch": 0.9171174475107728, + "learning_rate": 1.6578344182635005e-05, + "loss": 0.976, + "mean_token_accuracy": 0.704130619764328, + "num_tokens": 247811777.0, + "step": 100030 + }, + { + "epoch": 0.9172091317502521, + "learning_rate": 1.6560007334739157e-05, + "loss": 0.9499, + "mean_token_accuracy": 0.715839284658432, + "num_tokens": 247840103.0, + "step": 100040 + }, + { + "epoch": 0.9173008159897313, + "learning_rate": 1.6541670486843312e-05, + "loss": 0.9467, + "mean_token_accuracy": 0.7104815423488617, + "num_tokens": 247867476.0, + "step": 100050 + }, + { + "epoch": 0.9173925002292106, + "learning_rate": 1.6523333638947467e-05, + "loss": 0.9482, + "mean_token_accuracy": 0.7036938011646271, + "num_tokens": 247894941.0, + "step": 100060 + }, + { + "epoch": 0.9174841844686898, + "learning_rate": 1.650499679105162e-05, + "loss": 0.941, + "mean_token_accuracy": 0.711452579498291, + "num_tokens": 247923325.0, + "step": 100070 + }, + { + "epoch": 0.9175758687081691, + "learning_rate": 1.648665994315577e-05, + "loss": 0.9682, + "mean_token_accuracy": 0.7044674515724182, + "num_tokens": 247951961.0, + "step": 100080 + }, + { + "epoch": 0.9176675529476483, + "learning_rate": 1.6468323095259923e-05, + "loss": 0.9615, + "mean_token_accuracy": 0.7075078308582305, + "num_tokens": 247981138.0, + "step": 100090 + }, + { + "epoch": 0.9177592371871275, + "learning_rate": 1.6449986247364078e-05, + "loss": 0.9681, + "mean_token_accuracy": 0.7054571211338043, + "num_tokens": 248009302.0, + "step": 100100 + }, + { + "epoch": 0.9178509214266067, + "learning_rate": 1.6431649399468234e-05, + "loss": 0.9577, + "mean_token_accuracy": 0.7064182341098786, + "num_tokens": 248037454.0, + "step": 100110 + }, + { + "epoch": 0.917942605666086, + "learning_rate": 1.6413312551572385e-05, + "loss": 0.9564, + "mean_token_accuracy": 0.707996416091919, + "num_tokens": 248064480.0, + "step": 100120 + }, + { + "epoch": 0.9180342899055652, + "learning_rate": 1.6394975703676537e-05, + "loss": 0.9554, + "mean_token_accuracy": 0.7101505339145661, + "num_tokens": 248092366.0, + "step": 100130 + }, + { + "epoch": 0.9181259741450445, + "learning_rate": 1.6376638855780693e-05, + "loss": 0.95, + "mean_token_accuracy": 0.7134077310562134, + "num_tokens": 248119625.0, + "step": 100140 + }, + { + "epoch": 0.9182176583845237, + "learning_rate": 1.6358302007884844e-05, + "loss": 0.9784, + "mean_token_accuracy": 0.7073571622371674, + "num_tokens": 248147521.0, + "step": 100150 + }, + { + "epoch": 0.918309342624003, + "learning_rate": 1.6339965159989e-05, + "loss": 0.9642, + "mean_token_accuracy": 0.7048455774784088, + "num_tokens": 248174983.0, + "step": 100160 + }, + { + "epoch": 0.9184010268634821, + "learning_rate": 1.632162831209315e-05, + "loss": 0.9473, + "mean_token_accuracy": 0.713927811384201, + "num_tokens": 248203396.0, + "step": 100170 + }, + { + "epoch": 0.9184927111029614, + "learning_rate": 1.6303291464197303e-05, + "loss": 0.9453, + "mean_token_accuracy": 0.7139868080615998, + "num_tokens": 248230782.0, + "step": 100180 + }, + { + "epoch": 0.9185843953424406, + "learning_rate": 1.628495461630146e-05, + "loss": 0.9569, + "mean_token_accuracy": 0.7076826691627502, + "num_tokens": 248258475.0, + "step": 100190 + }, + { + "epoch": 0.9186760795819199, + "learning_rate": 1.626661776840561e-05, + "loss": 0.9595, + "mean_token_accuracy": 0.708940851688385, + "num_tokens": 248286546.0, + "step": 100200 + }, + { + "epoch": 0.9187677638213991, + "learning_rate": 1.6248280920509766e-05, + "loss": 0.9509, + "mean_token_accuracy": 0.7117028594017029, + "num_tokens": 248314924.0, + "step": 100210 + }, + { + "epoch": 0.9188594480608784, + "learning_rate": 1.6229944072613918e-05, + "loss": 0.9577, + "mean_token_accuracy": 0.7107714116573334, + "num_tokens": 248343404.0, + "step": 100220 + }, + { + "epoch": 0.9189511323003575, + "learning_rate": 1.6211607224718073e-05, + "loss": 0.9226, + "mean_token_accuracy": 0.7155018031597138, + "num_tokens": 248371074.0, + "step": 100230 + }, + { + "epoch": 0.9190428165398368, + "learning_rate": 1.6193270376822225e-05, + "loss": 0.9863, + "mean_token_accuracy": 0.7039390444755554, + "num_tokens": 248398758.0, + "step": 100240 + }, + { + "epoch": 0.919134500779316, + "learning_rate": 1.6174933528926377e-05, + "loss": 0.9752, + "mean_token_accuracy": 0.7047863602638245, + "num_tokens": 248426748.0, + "step": 100250 + }, + { + "epoch": 0.9192261850187953, + "learning_rate": 1.6156596681030532e-05, + "loss": 0.9636, + "mean_token_accuracy": 0.7020634472370147, + "num_tokens": 248454586.0, + "step": 100260 + }, + { + "epoch": 0.9193178692582745, + "learning_rate": 1.6138259833134687e-05, + "loss": 0.978, + "mean_token_accuracy": 0.7049915015697479, + "num_tokens": 248482809.0, + "step": 100270 + }, + { + "epoch": 0.9194095534977538, + "learning_rate": 1.611992298523884e-05, + "loss": 0.96, + "mean_token_accuracy": 0.7088077008724213, + "num_tokens": 248511108.0, + "step": 100280 + }, + { + "epoch": 0.919501237737233, + "learning_rate": 1.610158613734299e-05, + "loss": 0.9377, + "mean_token_accuracy": 0.7143801927566529, + "num_tokens": 248538791.0, + "step": 100290 + }, + { + "epoch": 0.9195929219767122, + "learning_rate": 1.6083249289447143e-05, + "loss": 1.0013, + "mean_token_accuracy": 0.702047199010849, + "num_tokens": 248567153.0, + "step": 100300 + }, + { + "epoch": 0.9196846062161914, + "learning_rate": 1.6064912441551298e-05, + "loss": 0.9588, + "mean_token_accuracy": 0.7086064577102661, + "num_tokens": 248594810.0, + "step": 100310 + }, + { + "epoch": 0.9197762904556707, + "learning_rate": 1.6046575593655453e-05, + "loss": 0.9497, + "mean_token_accuracy": 0.7123761355876923, + "num_tokens": 248622865.0, + "step": 100320 + }, + { + "epoch": 0.9198679746951499, + "learning_rate": 1.6028238745759605e-05, + "loss": 0.9697, + "mean_token_accuracy": 0.7054692029953002, + "num_tokens": 248649871.0, + "step": 100330 + }, + { + "epoch": 0.9199596589346292, + "learning_rate": 1.6009901897863757e-05, + "loss": 0.9767, + "mean_token_accuracy": 0.7065792143344879, + "num_tokens": 248678583.0, + "step": 100340 + }, + { + "epoch": 0.9200513431741084, + "learning_rate": 1.599156504996791e-05, + "loss": 0.9758, + "mean_token_accuracy": 0.7048300802707672, + "num_tokens": 248706543.0, + "step": 100350 + }, + { + "epoch": 0.9201430274135876, + "learning_rate": 1.5973228202072068e-05, + "loss": 0.9153, + "mean_token_accuracy": 0.7165494084358215, + "num_tokens": 248734240.0, + "step": 100360 + }, + { + "epoch": 0.9202347116530668, + "learning_rate": 1.595489135417622e-05, + "loss": 0.9482, + "mean_token_accuracy": 0.7105397284030914, + "num_tokens": 248762583.0, + "step": 100370 + }, + { + "epoch": 0.9203263958925461, + "learning_rate": 1.593655450628037e-05, + "loss": 0.9528, + "mean_token_accuracy": 0.7131660044193268, + "num_tokens": 248790061.0, + "step": 100380 + }, + { + "epoch": 0.9204180801320253, + "learning_rate": 1.5918217658384523e-05, + "loss": 0.9914, + "mean_token_accuracy": 0.7015332520008087, + "num_tokens": 248817815.0, + "step": 100390 + }, + { + "epoch": 0.9205097643715046, + "learning_rate": 1.5899880810488675e-05, + "loss": 0.9368, + "mean_token_accuracy": 0.7151429891586304, + "num_tokens": 248846376.0, + "step": 100400 + }, + { + "epoch": 0.9206014486109838, + "learning_rate": 1.5881543962592834e-05, + "loss": 0.9636, + "mean_token_accuracy": 0.7101771891117096, + "num_tokens": 248874429.0, + "step": 100410 + }, + { + "epoch": 0.9206931328504631, + "learning_rate": 1.5863207114696985e-05, + "loss": 0.9803, + "mean_token_accuracy": 0.7020486354827881, + "num_tokens": 248902431.0, + "step": 100420 + }, + { + "epoch": 0.9207848170899422, + "learning_rate": 1.5844870266801137e-05, + "loss": 0.9452, + "mean_token_accuracy": 0.717402845621109, + "num_tokens": 248930897.0, + "step": 100430 + }, + { + "epoch": 0.9208765013294214, + "learning_rate": 1.582653341890529e-05, + "loss": 0.9368, + "mean_token_accuracy": 0.7192105889320374, + "num_tokens": 248958107.0, + "step": 100440 + }, + { + "epoch": 0.9209681855689007, + "learning_rate": 1.5808196571009444e-05, + "loss": 0.9564, + "mean_token_accuracy": 0.7145209670066833, + "num_tokens": 248986624.0, + "step": 100450 + }, + { + "epoch": 0.92105986980838, + "learning_rate": 1.57898597231136e-05, + "loss": 0.9729, + "mean_token_accuracy": 0.7003249943256378, + "num_tokens": 249015154.0, + "step": 100460 + }, + { + "epoch": 0.9211515540478592, + "learning_rate": 1.577152287521775e-05, + "loss": 0.9657, + "mean_token_accuracy": 0.7100578725337983, + "num_tokens": 249043422.0, + "step": 100470 + }, + { + "epoch": 0.9212432382873385, + "learning_rate": 1.5753186027321903e-05, + "loss": 0.9685, + "mean_token_accuracy": 0.705563622713089, + "num_tokens": 249070893.0, + "step": 100480 + }, + { + "epoch": 0.9213349225268176, + "learning_rate": 1.5734849179426055e-05, + "loss": 0.9303, + "mean_token_accuracy": 0.7130422115325927, + "num_tokens": 249099313.0, + "step": 100490 + }, + { + "epoch": 0.9214266067662968, + "learning_rate": 1.571651233153021e-05, + "loss": 0.945, + "mean_token_accuracy": 0.7152499079704284, + "num_tokens": 249127599.0, + "step": 100500 + }, + { + "epoch": 0.9215182910057761, + "learning_rate": 1.5698175483634366e-05, + "loss": 0.9557, + "mean_token_accuracy": 0.7070723831653595, + "num_tokens": 249155063.0, + "step": 100510 + }, + { + "epoch": 0.9216099752452553, + "learning_rate": 1.5679838635738518e-05, + "loss": 0.9533, + "mean_token_accuracy": 0.7138455748558045, + "num_tokens": 249182490.0, + "step": 100520 + }, + { + "epoch": 0.9217016594847346, + "learning_rate": 1.566150178784267e-05, + "loss": 0.961, + "mean_token_accuracy": 0.705112737417221, + "num_tokens": 249211041.0, + "step": 100530 + }, + { + "epoch": 0.9217933437242138, + "learning_rate": 1.5643164939946825e-05, + "loss": 0.9465, + "mean_token_accuracy": 0.7117710888385773, + "num_tokens": 249239833.0, + "step": 100540 + }, + { + "epoch": 0.9218850279636931, + "learning_rate": 1.5624828092050977e-05, + "loss": 0.9996, + "mean_token_accuracy": 0.6976643860340118, + "num_tokens": 249268502.0, + "step": 100550 + }, + { + "epoch": 0.9219767122031722, + "learning_rate": 1.5606491244155132e-05, + "loss": 0.9607, + "mean_token_accuracy": 0.7141707420349122, + "num_tokens": 249296653.0, + "step": 100560 + }, + { + "epoch": 0.9220683964426515, + "learning_rate": 1.5588154396259284e-05, + "loss": 0.9231, + "mean_token_accuracy": 0.7176756381988525, + "num_tokens": 249323642.0, + "step": 100570 + }, + { + "epoch": 0.9221600806821307, + "learning_rate": 1.556981754836344e-05, + "loss": 0.9516, + "mean_token_accuracy": 0.7097282767295837, + "num_tokens": 249352347.0, + "step": 100580 + }, + { + "epoch": 0.92225176492161, + "learning_rate": 1.555148070046759e-05, + "loss": 0.9485, + "mean_token_accuracy": 0.7109363079071045, + "num_tokens": 249381443.0, + "step": 100590 + }, + { + "epoch": 0.9223434491610892, + "learning_rate": 1.5533143852571743e-05, + "loss": 0.9792, + "mean_token_accuracy": 0.6996920287609101, + "num_tokens": 249409473.0, + "step": 100600 + }, + { + "epoch": 0.9224351334005685, + "learning_rate": 1.5514807004675898e-05, + "loss": 0.968, + "mean_token_accuracy": 0.7075730323791504, + "num_tokens": 249437197.0, + "step": 100610 + }, + { + "epoch": 0.9225268176400476, + "learning_rate": 1.549647015678005e-05, + "loss": 0.9445, + "mean_token_accuracy": 0.7086631119251251, + "num_tokens": 249464874.0, + "step": 100620 + }, + { + "epoch": 0.9226185018795269, + "learning_rate": 1.5478133308884205e-05, + "loss": 0.9476, + "mean_token_accuracy": 0.713670402765274, + "num_tokens": 249492726.0, + "step": 100630 + }, + { + "epoch": 0.9227101861190061, + "learning_rate": 1.5459796460988357e-05, + "loss": 0.9602, + "mean_token_accuracy": 0.7114905118942261, + "num_tokens": 249519502.0, + "step": 100640 + }, + { + "epoch": 0.9228018703584854, + "learning_rate": 1.544145961309251e-05, + "loss": 0.9772, + "mean_token_accuracy": 0.7055188179016113, + "num_tokens": 249546660.0, + "step": 100650 + }, + { + "epoch": 0.9228935545979646, + "learning_rate": 1.5423122765196664e-05, + "loss": 0.9126, + "mean_token_accuracy": 0.7191270232200623, + "num_tokens": 249574683.0, + "step": 100660 + }, + { + "epoch": 0.9229852388374439, + "learning_rate": 1.540478591730082e-05, + "loss": 0.9692, + "mean_token_accuracy": 0.7035593748092651, + "num_tokens": 249603450.0, + "step": 100670 + }, + { + "epoch": 0.9230769230769231, + "learning_rate": 1.538644906940497e-05, + "loss": 0.9328, + "mean_token_accuracy": 0.7143905282020568, + "num_tokens": 249630873.0, + "step": 100680 + }, + { + "epoch": 0.9231686073164023, + "learning_rate": 1.5368112221509123e-05, + "loss": 0.9709, + "mean_token_accuracy": 0.7070143282413482, + "num_tokens": 249659458.0, + "step": 100690 + }, + { + "epoch": 0.9232602915558815, + "learning_rate": 1.5349775373613275e-05, + "loss": 0.9417, + "mean_token_accuracy": 0.7143168449401855, + "num_tokens": 249686948.0, + "step": 100700 + }, + { + "epoch": 0.9233519757953608, + "learning_rate": 1.533143852571743e-05, + "loss": 0.9728, + "mean_token_accuracy": 0.7064504802227021, + "num_tokens": 249714505.0, + "step": 100710 + }, + { + "epoch": 0.92344366003484, + "learning_rate": 1.5313101677821586e-05, + "loss": 0.9597, + "mean_token_accuracy": 0.7091737151145935, + "num_tokens": 249742298.0, + "step": 100720 + }, + { + "epoch": 0.9235353442743193, + "learning_rate": 1.5294764829925737e-05, + "loss": 0.9315, + "mean_token_accuracy": 0.7164255201816558, + "num_tokens": 249769413.0, + "step": 100730 + }, + { + "epoch": 0.9236270285137985, + "learning_rate": 1.527642798202989e-05, + "loss": 0.9574, + "mean_token_accuracy": 0.7113082051277161, + "num_tokens": 249797908.0, + "step": 100740 + }, + { + "epoch": 0.9237187127532777, + "learning_rate": 1.5258091134134043e-05, + "loss": 0.9512, + "mean_token_accuracy": 0.7109612941741943, + "num_tokens": 249825695.0, + "step": 100750 + }, + { + "epoch": 0.9238103969927569, + "learning_rate": 1.5239754286238198e-05, + "loss": 0.9481, + "mean_token_accuracy": 0.708267605304718, + "num_tokens": 249853543.0, + "step": 100760 + }, + { + "epoch": 0.9239020812322362, + "learning_rate": 1.522141743834235e-05, + "loss": 0.928, + "mean_token_accuracy": 0.7176929891109467, + "num_tokens": 249881404.0, + "step": 100770 + }, + { + "epoch": 0.9239937654717154, + "learning_rate": 1.5203080590446504e-05, + "loss": 0.9938, + "mean_token_accuracy": 0.6983058214187622, + "num_tokens": 249909254.0, + "step": 100780 + }, + { + "epoch": 0.9240854497111947, + "learning_rate": 1.5184743742550655e-05, + "loss": 0.9379, + "mean_token_accuracy": 0.7137408256530762, + "num_tokens": 249936898.0, + "step": 100790 + }, + { + "epoch": 0.9241771339506739, + "learning_rate": 1.5166406894654809e-05, + "loss": 0.9425, + "mean_token_accuracy": 0.716493946313858, + "num_tokens": 249964352.0, + "step": 100800 + }, + { + "epoch": 0.9242688181901532, + "learning_rate": 1.5148070046758964e-05, + "loss": 0.9716, + "mean_token_accuracy": 0.7079392313957215, + "num_tokens": 249992129.0, + "step": 100810 + }, + { + "epoch": 0.9243605024296323, + "learning_rate": 1.5129733198863116e-05, + "loss": 0.9452, + "mean_token_accuracy": 0.7150243043899536, + "num_tokens": 250020345.0, + "step": 100820 + }, + { + "epoch": 0.9244521866691116, + "learning_rate": 1.511139635096727e-05, + "loss": 0.9529, + "mean_token_accuracy": 0.709873503446579, + "num_tokens": 250048073.0, + "step": 100830 + }, + { + "epoch": 0.9245438709085908, + "learning_rate": 1.5093059503071422e-05, + "loss": 0.9575, + "mean_token_accuracy": 0.7116186380386352, + "num_tokens": 250076032.0, + "step": 100840 + }, + { + "epoch": 0.92463555514807, + "learning_rate": 1.5074722655175577e-05, + "loss": 0.9589, + "mean_token_accuracy": 0.7067624449729919, + "num_tokens": 250104165.0, + "step": 100850 + }, + { + "epoch": 0.9247272393875493, + "learning_rate": 1.505638580727973e-05, + "loss": 0.9384, + "mean_token_accuracy": 0.7108546733856201, + "num_tokens": 250132564.0, + "step": 100860 + }, + { + "epoch": 0.9248189236270286, + "learning_rate": 1.5038048959383882e-05, + "loss": 0.9858, + "mean_token_accuracy": 0.7066552817821503, + "num_tokens": 250160719.0, + "step": 100870 + }, + { + "epoch": 0.9249106078665077, + "learning_rate": 1.5019712111488036e-05, + "loss": 0.9681, + "mean_token_accuracy": 0.7042514204978942, + "num_tokens": 250188000.0, + "step": 100880 + }, + { + "epoch": 0.925002292105987, + "learning_rate": 1.5001375263592191e-05, + "loss": 0.9345, + "mean_token_accuracy": 0.7192918658256531, + "num_tokens": 250216120.0, + "step": 100890 + }, + { + "epoch": 0.9250939763454662, + "learning_rate": 1.4983038415696343e-05, + "loss": 0.9579, + "mean_token_accuracy": 0.7102409124374389, + "num_tokens": 250243980.0, + "step": 100900 + }, + { + "epoch": 0.9251856605849454, + "learning_rate": 1.4964701567800496e-05, + "loss": 0.9587, + "mean_token_accuracy": 0.7072044909000397, + "num_tokens": 250271061.0, + "step": 100910 + }, + { + "epoch": 0.9252773448244247, + "learning_rate": 1.4946364719904648e-05, + "loss": 0.9673, + "mean_token_accuracy": 0.7044660568237304, + "num_tokens": 250298980.0, + "step": 100920 + }, + { + "epoch": 0.925369029063904, + "learning_rate": 1.4928027872008802e-05, + "loss": 0.9743, + "mean_token_accuracy": 0.7075785040855408, + "num_tokens": 250327253.0, + "step": 100930 + }, + { + "epoch": 0.9254607133033832, + "learning_rate": 1.4909691024112957e-05, + "loss": 0.9603, + "mean_token_accuracy": 0.7101104617118835, + "num_tokens": 250355145.0, + "step": 100940 + }, + { + "epoch": 0.9255523975428623, + "learning_rate": 1.4891354176217109e-05, + "loss": 0.9607, + "mean_token_accuracy": 0.7078048586845398, + "num_tokens": 250382940.0, + "step": 100950 + }, + { + "epoch": 0.9256440817823416, + "learning_rate": 1.4873017328321263e-05, + "loss": 0.9457, + "mean_token_accuracy": 0.7161997199058533, + "num_tokens": 250410482.0, + "step": 100960 + }, + { + "epoch": 0.9257357660218208, + "learning_rate": 1.4854680480425414e-05, + "loss": 0.9501, + "mean_token_accuracy": 0.709575068950653, + "num_tokens": 250439187.0, + "step": 100970 + }, + { + "epoch": 0.9258274502613001, + "learning_rate": 1.483634363252957e-05, + "loss": 0.9398, + "mean_token_accuracy": 0.7123695969581604, + "num_tokens": 250467911.0, + "step": 100980 + }, + { + "epoch": 0.9259191345007793, + "learning_rate": 1.4818006784633723e-05, + "loss": 0.9891, + "mean_token_accuracy": 0.6986816644668579, + "num_tokens": 250496091.0, + "step": 100990 + }, + { + "epoch": 0.9260108187402586, + "learning_rate": 1.4799669936737875e-05, + "loss": 0.9414, + "mean_token_accuracy": 0.7116996347904205, + "num_tokens": 250524262.0, + "step": 101000 + }, + { + "epoch": 0.9261025029797377, + "learning_rate": 1.4781333088842029e-05, + "loss": 0.9509, + "mean_token_accuracy": 0.7090371906757355, + "num_tokens": 250551630.0, + "step": 101010 + }, + { + "epoch": 0.926194187219217, + "learning_rate": 1.476299624094618e-05, + "loss": 0.9518, + "mean_token_accuracy": 0.7161370575428009, + "num_tokens": 250579426.0, + "step": 101020 + }, + { + "epoch": 0.9262858714586962, + "learning_rate": 1.4744659393050336e-05, + "loss": 0.9847, + "mean_token_accuracy": 0.6985947608947753, + "num_tokens": 250607037.0, + "step": 101030 + }, + { + "epoch": 0.9263775556981755, + "learning_rate": 1.472632254515449e-05, + "loss": 0.9642, + "mean_token_accuracy": 0.7043582618236541, + "num_tokens": 250635378.0, + "step": 101040 + }, + { + "epoch": 0.9264692399376547, + "learning_rate": 1.4707985697258641e-05, + "loss": 0.9693, + "mean_token_accuracy": 0.7046302676200866, + "num_tokens": 250663272.0, + "step": 101050 + }, + { + "epoch": 0.926560924177134, + "learning_rate": 1.4689648849362795e-05, + "loss": 0.9678, + "mean_token_accuracy": 0.7033112704753876, + "num_tokens": 250690883.0, + "step": 101060 + }, + { + "epoch": 0.9266526084166132, + "learning_rate": 1.467131200146695e-05, + "loss": 0.9315, + "mean_token_accuracy": 0.7134780585765839, + "num_tokens": 250719225.0, + "step": 101070 + }, + { + "epoch": 0.9267442926560924, + "learning_rate": 1.4652975153571102e-05, + "loss": 0.9579, + "mean_token_accuracy": 0.7079670011997223, + "num_tokens": 250747249.0, + "step": 101080 + }, + { + "epoch": 0.9268359768955716, + "learning_rate": 1.4634638305675255e-05, + "loss": 0.9559, + "mean_token_accuracy": 0.706309849023819, + "num_tokens": 250775586.0, + "step": 101090 + }, + { + "epoch": 0.9269276611350509, + "learning_rate": 1.4616301457779407e-05, + "loss": 0.9361, + "mean_token_accuracy": 0.7131204187870026, + "num_tokens": 250803850.0, + "step": 101100 + }, + { + "epoch": 0.9270193453745301, + "learning_rate": 1.4597964609883561e-05, + "loss": 0.9526, + "mean_token_accuracy": 0.7098627209663391, + "num_tokens": 250832286.0, + "step": 101110 + }, + { + "epoch": 0.9271110296140094, + "learning_rate": 1.4579627761987716e-05, + "loss": 0.9641, + "mean_token_accuracy": 0.7075021147727967, + "num_tokens": 250861050.0, + "step": 101120 + }, + { + "epoch": 0.9272027138534886, + "learning_rate": 1.4561290914091868e-05, + "loss": 0.9672, + "mean_token_accuracy": 0.7055325388908387, + "num_tokens": 250889481.0, + "step": 101130 + }, + { + "epoch": 0.9272943980929678, + "learning_rate": 1.4542954066196022e-05, + "loss": 0.9304, + "mean_token_accuracy": 0.7094467341899872, + "num_tokens": 250916663.0, + "step": 101140 + }, + { + "epoch": 0.927386082332447, + "learning_rate": 1.4524617218300173e-05, + "loss": 0.9571, + "mean_token_accuracy": 0.7061554670333863, + "num_tokens": 250944766.0, + "step": 101150 + }, + { + "epoch": 0.9274777665719263, + "learning_rate": 1.4506280370404329e-05, + "loss": 0.9345, + "mean_token_accuracy": 0.7128243148326874, + "num_tokens": 250972471.0, + "step": 101160 + }, + { + "epoch": 0.9275694508114055, + "learning_rate": 1.4487943522508482e-05, + "loss": 0.9532, + "mean_token_accuracy": 0.7105517029762268, + "num_tokens": 250999623.0, + "step": 101170 + }, + { + "epoch": 0.9276611350508848, + "learning_rate": 1.4469606674612634e-05, + "loss": 0.9549, + "mean_token_accuracy": 0.7110942423343658, + "num_tokens": 251026727.0, + "step": 101180 + }, + { + "epoch": 0.927752819290364, + "learning_rate": 1.4451269826716788e-05, + "loss": 0.9394, + "mean_token_accuracy": 0.7118489742279053, + "num_tokens": 251054410.0, + "step": 101190 + }, + { + "epoch": 0.9278445035298433, + "learning_rate": 1.4432932978820943e-05, + "loss": 0.9458, + "mean_token_accuracy": 0.7079277634620667, + "num_tokens": 251082805.0, + "step": 101200 + }, + { + "epoch": 0.9279361877693224, + "learning_rate": 1.4414596130925095e-05, + "loss": 0.9575, + "mean_token_accuracy": 0.7132249712944031, + "num_tokens": 251112012.0, + "step": 101210 + }, + { + "epoch": 0.9280278720088017, + "learning_rate": 1.4396259283029248e-05, + "loss": 0.9675, + "mean_token_accuracy": 0.7074493169784546, + "num_tokens": 251139131.0, + "step": 101220 + }, + { + "epoch": 0.9281195562482809, + "learning_rate": 1.43779224351334e-05, + "loss": 0.9465, + "mean_token_accuracy": 0.7088360667228699, + "num_tokens": 251167332.0, + "step": 101230 + }, + { + "epoch": 0.9282112404877602, + "learning_rate": 1.4359585587237554e-05, + "loss": 0.9377, + "mean_token_accuracy": 0.7143978297710418, + "num_tokens": 251194765.0, + "step": 101240 + }, + { + "epoch": 0.9283029247272394, + "learning_rate": 1.4341248739341709e-05, + "loss": 0.9561, + "mean_token_accuracy": 0.7093397915363312, + "num_tokens": 251222159.0, + "step": 101250 + }, + { + "epoch": 0.9283946089667187, + "learning_rate": 1.4322911891445861e-05, + "loss": 0.9245, + "mean_token_accuracy": 0.7178255259990692, + "num_tokens": 251249107.0, + "step": 101260 + }, + { + "epoch": 0.9284862932061978, + "learning_rate": 1.4304575043550015e-05, + "loss": 0.9749, + "mean_token_accuracy": 0.7051239430904388, + "num_tokens": 251277101.0, + "step": 101270 + }, + { + "epoch": 0.928577977445677, + "learning_rate": 1.4286238195654166e-05, + "loss": 0.9612, + "mean_token_accuracy": 0.7061001837253571, + "num_tokens": 251304552.0, + "step": 101280 + }, + { + "epoch": 0.9286696616851563, + "learning_rate": 1.4267901347758322e-05, + "loss": 0.9647, + "mean_token_accuracy": 0.7067552268505096, + "num_tokens": 251332198.0, + "step": 101290 + }, + { + "epoch": 0.9287613459246356, + "learning_rate": 1.4249564499862475e-05, + "loss": 0.9469, + "mean_token_accuracy": 0.7085455417633056, + "num_tokens": 251360424.0, + "step": 101300 + }, + { + "epoch": 0.9288530301641148, + "learning_rate": 1.4231227651966627e-05, + "loss": 0.9734, + "mean_token_accuracy": 0.7017104625701904, + "num_tokens": 251388581.0, + "step": 101310 + }, + { + "epoch": 0.928944714403594, + "learning_rate": 1.421289080407078e-05, + "loss": 0.9634, + "mean_token_accuracy": 0.7036072313785553, + "num_tokens": 251416086.0, + "step": 101320 + }, + { + "epoch": 0.9290363986430733, + "learning_rate": 1.4194553956174932e-05, + "loss": 0.9925, + "mean_token_accuracy": 0.7028466284275054, + "num_tokens": 251444125.0, + "step": 101330 + }, + { + "epoch": 0.9291280828825524, + "learning_rate": 1.4176217108279088e-05, + "loss": 0.9431, + "mean_token_accuracy": 0.7126602232456207, + "num_tokens": 251472825.0, + "step": 101340 + }, + { + "epoch": 0.9292197671220317, + "learning_rate": 1.4157880260383241e-05, + "loss": 0.9588, + "mean_token_accuracy": 0.7097715973854065, + "num_tokens": 251500351.0, + "step": 101350 + }, + { + "epoch": 0.9293114513615109, + "learning_rate": 1.4139543412487393e-05, + "loss": 0.963, + "mean_token_accuracy": 0.7072455525398255, + "num_tokens": 251528803.0, + "step": 101360 + }, + { + "epoch": 0.9294031356009902, + "learning_rate": 1.4121206564591547e-05, + "loss": 0.9476, + "mean_token_accuracy": 0.7109055340290069, + "num_tokens": 251557303.0, + "step": 101370 + }, + { + "epoch": 0.9294948198404694, + "learning_rate": 1.4102869716695702e-05, + "loss": 0.9617, + "mean_token_accuracy": 0.7036132216453552, + "num_tokens": 251585660.0, + "step": 101380 + }, + { + "epoch": 0.9295865040799487, + "learning_rate": 1.4084532868799854e-05, + "loss": 0.9465, + "mean_token_accuracy": 0.7148278295993805, + "num_tokens": 251614408.0, + "step": 101390 + }, + { + "epoch": 0.929678188319428, + "learning_rate": 1.4066196020904007e-05, + "loss": 0.9454, + "mean_token_accuracy": 0.7096316576004028, + "num_tokens": 251642152.0, + "step": 101400 + }, + { + "epoch": 0.9297698725589071, + "learning_rate": 1.404785917300816e-05, + "loss": 0.9912, + "mean_token_accuracy": 0.7031850814819336, + "num_tokens": 251670052.0, + "step": 101410 + }, + { + "epoch": 0.9298615567983863, + "learning_rate": 1.4029522325112313e-05, + "loss": 0.9436, + "mean_token_accuracy": 0.7077620148658752, + "num_tokens": 251698642.0, + "step": 101420 + }, + { + "epoch": 0.9299532410378656, + "learning_rate": 1.4011185477216468e-05, + "loss": 0.97, + "mean_token_accuracy": 0.701517003774643, + "num_tokens": 251727569.0, + "step": 101430 + }, + { + "epoch": 0.9300449252773448, + "learning_rate": 1.399284862932062e-05, + "loss": 0.9476, + "mean_token_accuracy": 0.7125502228736877, + "num_tokens": 251755531.0, + "step": 101440 + }, + { + "epoch": 0.9301366095168241, + "learning_rate": 1.3974511781424774e-05, + "loss": 0.9625, + "mean_token_accuracy": 0.708078944683075, + "num_tokens": 251782304.0, + "step": 101450 + }, + { + "epoch": 0.9302282937563033, + "learning_rate": 1.3956174933528925e-05, + "loss": 0.9653, + "mean_token_accuracy": 0.7106375336647034, + "num_tokens": 251809774.0, + "step": 101460 + }, + { + "epoch": 0.9303199779957825, + "learning_rate": 1.393783808563308e-05, + "loss": 0.9236, + "mean_token_accuracy": 0.7176149249076843, + "num_tokens": 251837524.0, + "step": 101470 + }, + { + "epoch": 0.9304116622352617, + "learning_rate": 1.3919501237737234e-05, + "loss": 0.9498, + "mean_token_accuracy": 0.7041159570217133, + "num_tokens": 251865288.0, + "step": 101480 + }, + { + "epoch": 0.930503346474741, + "learning_rate": 1.3901164389841386e-05, + "loss": 0.9685, + "mean_token_accuracy": 0.709986287355423, + "num_tokens": 251893657.0, + "step": 101490 + }, + { + "epoch": 0.9305950307142202, + "learning_rate": 1.388282754194554e-05, + "loss": 0.9724, + "mean_token_accuracy": 0.7070633471012115, + "num_tokens": 251922286.0, + "step": 101500 + }, + { + "epoch": 0.9306867149536995, + "learning_rate": 1.3864490694049692e-05, + "loss": 0.9595, + "mean_token_accuracy": 0.7094040215015411, + "num_tokens": 251949615.0, + "step": 101510 + }, + { + "epoch": 0.9307783991931787, + "learning_rate": 1.3846153846153847e-05, + "loss": 0.9574, + "mean_token_accuracy": 0.7079304873943328, + "num_tokens": 251977913.0, + "step": 101520 + }, + { + "epoch": 0.930870083432658, + "learning_rate": 1.3827816998258e-05, + "loss": 0.9481, + "mean_token_accuracy": 0.7147959291934967, + "num_tokens": 252006111.0, + "step": 101530 + }, + { + "epoch": 0.9309617676721371, + "learning_rate": 1.3809480150362152e-05, + "loss": 0.9494, + "mean_token_accuracy": 0.7095328748226166, + "num_tokens": 252033972.0, + "step": 101540 + }, + { + "epoch": 0.9310534519116164, + "learning_rate": 1.3791143302466306e-05, + "loss": 0.9193, + "mean_token_accuracy": 0.7209644436836242, + "num_tokens": 252061731.0, + "step": 101550 + }, + { + "epoch": 0.9311451361510956, + "learning_rate": 1.3772806454570461e-05, + "loss": 0.9397, + "mean_token_accuracy": 0.7114929676055908, + "num_tokens": 252089921.0, + "step": 101560 + }, + { + "epoch": 0.9312368203905749, + "learning_rate": 1.3754469606674613e-05, + "loss": 0.9446, + "mean_token_accuracy": 0.7108826100826263, + "num_tokens": 252117592.0, + "step": 101570 + }, + { + "epoch": 0.9313285046300541, + "learning_rate": 1.3736132758778766e-05, + "loss": 0.9357, + "mean_token_accuracy": 0.714998471736908, + "num_tokens": 252145036.0, + "step": 101580 + }, + { + "epoch": 0.9314201888695334, + "learning_rate": 1.3717795910882918e-05, + "loss": 0.9509, + "mean_token_accuracy": 0.7109091997146606, + "num_tokens": 252173369.0, + "step": 101590 + }, + { + "epoch": 0.9315118731090125, + "learning_rate": 1.3699459062987075e-05, + "loss": 0.9446, + "mean_token_accuracy": 0.7140315294265747, + "num_tokens": 252201094.0, + "step": 101600 + }, + { + "epoch": 0.9316035573484918, + "learning_rate": 1.3681122215091227e-05, + "loss": 0.9568, + "mean_token_accuracy": 0.707772308588028, + "num_tokens": 252228076.0, + "step": 101610 + }, + { + "epoch": 0.931695241587971, + "learning_rate": 1.3662785367195379e-05, + "loss": 0.9364, + "mean_token_accuracy": 0.7147785305976868, + "num_tokens": 252255759.0, + "step": 101620 + }, + { + "epoch": 0.9317869258274503, + "learning_rate": 1.3644448519299533e-05, + "loss": 0.9598, + "mean_token_accuracy": 0.7093723058700562, + "num_tokens": 252283682.0, + "step": 101630 + }, + { + "epoch": 0.9318786100669295, + "learning_rate": 1.3626111671403684e-05, + "loss": 0.965, + "mean_token_accuracy": 0.7094361782073975, + "num_tokens": 252311610.0, + "step": 101640 + }, + { + "epoch": 0.9319702943064088, + "learning_rate": 1.3607774823507841e-05, + "loss": 0.9531, + "mean_token_accuracy": 0.7079195976257324, + "num_tokens": 252339223.0, + "step": 101650 + }, + { + "epoch": 0.932061978545888, + "learning_rate": 1.3589437975611993e-05, + "loss": 0.9299, + "mean_token_accuracy": 0.7151159167289733, + "num_tokens": 252367776.0, + "step": 101660 + }, + { + "epoch": 0.9321536627853672, + "learning_rate": 1.3571101127716145e-05, + "loss": 0.9566, + "mean_token_accuracy": 0.7099621832370758, + "num_tokens": 252395613.0, + "step": 101670 + }, + { + "epoch": 0.9322453470248464, + "learning_rate": 1.3552764279820299e-05, + "loss": 0.987, + "mean_token_accuracy": 0.7034406185150146, + "num_tokens": 252423526.0, + "step": 101680 + }, + { + "epoch": 0.9323370312643257, + "learning_rate": 1.3534427431924454e-05, + "loss": 0.9181, + "mean_token_accuracy": 0.7155993700027465, + "num_tokens": 252451375.0, + "step": 101690 + }, + { + "epoch": 0.9324287155038049, + "learning_rate": 1.3516090584028607e-05, + "loss": 0.9643, + "mean_token_accuracy": 0.712075161933899, + "num_tokens": 252479086.0, + "step": 101700 + }, + { + "epoch": 0.9325203997432842, + "learning_rate": 1.349775373613276e-05, + "loss": 0.9352, + "mean_token_accuracy": 0.7157521069049835, + "num_tokens": 252507028.0, + "step": 101710 + }, + { + "epoch": 0.9326120839827634, + "learning_rate": 1.3479416888236911e-05, + "loss": 0.961, + "mean_token_accuracy": 0.7072499692440033, + "num_tokens": 252534821.0, + "step": 101720 + }, + { + "epoch": 0.9327037682222425, + "learning_rate": 1.3461080040341065e-05, + "loss": 0.9684, + "mean_token_accuracy": 0.7069429457187653, + "num_tokens": 252563456.0, + "step": 101730 + }, + { + "epoch": 0.9327954524617218, + "learning_rate": 1.344274319244522e-05, + "loss": 0.9268, + "mean_token_accuracy": 0.7155016183853149, + "num_tokens": 252590277.0, + "step": 101740 + }, + { + "epoch": 0.932887136701201, + "learning_rate": 1.3424406344549374e-05, + "loss": 0.954, + "mean_token_accuracy": 0.710516220331192, + "num_tokens": 252617635.0, + "step": 101750 + }, + { + "epoch": 0.9329788209406803, + "learning_rate": 1.3406069496653525e-05, + "loss": 0.9457, + "mean_token_accuracy": 0.7113356769084931, + "num_tokens": 252645654.0, + "step": 101760 + }, + { + "epoch": 0.9330705051801595, + "learning_rate": 1.3387732648757679e-05, + "loss": 0.9324, + "mean_token_accuracy": 0.7156642973423004, + "num_tokens": 252674099.0, + "step": 101770 + }, + { + "epoch": 0.9331621894196388, + "learning_rate": 1.3369395800861834e-05, + "loss": 0.9484, + "mean_token_accuracy": 0.7076420068740845, + "num_tokens": 252702306.0, + "step": 101780 + }, + { + "epoch": 0.933253873659118, + "learning_rate": 1.3351058952965986e-05, + "loss": 0.9529, + "mean_token_accuracy": 0.7138663232326508, + "num_tokens": 252729853.0, + "step": 101790 + }, + { + "epoch": 0.9333455578985972, + "learning_rate": 1.333272210507014e-05, + "loss": 0.9299, + "mean_token_accuracy": 0.7191498577594757, + "num_tokens": 252756698.0, + "step": 101800 + }, + { + "epoch": 0.9334372421380764, + "learning_rate": 1.3314385257174292e-05, + "loss": 0.9384, + "mean_token_accuracy": 0.7146835505962372, + "num_tokens": 252783938.0, + "step": 101810 + }, + { + "epoch": 0.9335289263775557, + "learning_rate": 1.3296048409278445e-05, + "loss": 0.9572, + "mean_token_accuracy": 0.7084337413311005, + "num_tokens": 252811611.0, + "step": 101820 + }, + { + "epoch": 0.9336206106170349, + "learning_rate": 1.32777115613826e-05, + "loss": 0.9605, + "mean_token_accuracy": 0.7086575090885162, + "num_tokens": 252839895.0, + "step": 101830 + }, + { + "epoch": 0.9337122948565142, + "learning_rate": 1.3259374713486752e-05, + "loss": 0.9679, + "mean_token_accuracy": 0.7077599704265595, + "num_tokens": 252867833.0, + "step": 101840 + }, + { + "epoch": 0.9338039790959934, + "learning_rate": 1.3241037865590906e-05, + "loss": 0.9604, + "mean_token_accuracy": 0.71173597574234, + "num_tokens": 252895954.0, + "step": 101850 + }, + { + "epoch": 0.9338956633354726, + "learning_rate": 1.3222701017695058e-05, + "loss": 0.9773, + "mean_token_accuracy": 0.7013697922229767, + "num_tokens": 252924627.0, + "step": 101860 + }, + { + "epoch": 0.9339873475749518, + "learning_rate": 1.3204364169799213e-05, + "loss": 0.9359, + "mean_token_accuracy": 0.7167365610599518, + "num_tokens": 252953616.0, + "step": 101870 + }, + { + "epoch": 0.9340790318144311, + "learning_rate": 1.3186027321903367e-05, + "loss": 0.9209, + "mean_token_accuracy": 0.7197913587093353, + "num_tokens": 252981384.0, + "step": 101880 + }, + { + "epoch": 0.9341707160539103, + "learning_rate": 1.3167690474007518e-05, + "loss": 0.9075, + "mean_token_accuracy": 0.7227952063083649, + "num_tokens": 253009639.0, + "step": 101890 + }, + { + "epoch": 0.9342624002933896, + "learning_rate": 1.3149353626111672e-05, + "loss": 0.9629, + "mean_token_accuracy": 0.7085484147071839, + "num_tokens": 253036932.0, + "step": 101900 + }, + { + "epoch": 0.9343540845328688, + "learning_rate": 1.3131016778215827e-05, + "loss": 0.934, + "mean_token_accuracy": 0.7167655944824218, + "num_tokens": 253064856.0, + "step": 101910 + }, + { + "epoch": 0.9344457687723481, + "learning_rate": 1.3112679930319979e-05, + "loss": 0.9563, + "mean_token_accuracy": 0.7140512526035309, + "num_tokens": 253092877.0, + "step": 101920 + }, + { + "epoch": 0.9345374530118272, + "learning_rate": 1.3094343082424133e-05, + "loss": 0.9385, + "mean_token_accuracy": 0.711508572101593, + "num_tokens": 253120696.0, + "step": 101930 + }, + { + "epoch": 0.9346291372513065, + "learning_rate": 1.3076006234528284e-05, + "loss": 0.9281, + "mean_token_accuracy": 0.7137085556983948, + "num_tokens": 253148616.0, + "step": 101940 + }, + { + "epoch": 0.9347208214907857, + "learning_rate": 1.3057669386632438e-05, + "loss": 0.9541, + "mean_token_accuracy": 0.7092041730880737, + "num_tokens": 253176685.0, + "step": 101950 + }, + { + "epoch": 0.934812505730265, + "learning_rate": 1.3039332538736593e-05, + "loss": 0.954, + "mean_token_accuracy": 0.7092980742454529, + "num_tokens": 253204508.0, + "step": 101960 + }, + { + "epoch": 0.9349041899697442, + "learning_rate": 1.3020995690840745e-05, + "loss": 0.9491, + "mean_token_accuracy": 0.7087125301361084, + "num_tokens": 253232864.0, + "step": 101970 + }, + { + "epoch": 0.9349958742092235, + "learning_rate": 1.3002658842944899e-05, + "loss": 0.9567, + "mean_token_accuracy": 0.708165442943573, + "num_tokens": 253260119.0, + "step": 101980 + }, + { + "epoch": 0.9350875584487026, + "learning_rate": 1.298432199504905e-05, + "loss": 0.9617, + "mean_token_accuracy": 0.7049558699131012, + "num_tokens": 253287693.0, + "step": 101990 + }, + { + "epoch": 0.9351792426881819, + "learning_rate": 1.2965985147153206e-05, + "loss": 0.9632, + "mean_token_accuracy": 0.7053045332431793, + "num_tokens": 253316909.0, + "step": 102000 + }, + { + "epoch": 0.9352709269276611, + "learning_rate": 1.294764829925736e-05, + "loss": 0.9534, + "mean_token_accuracy": 0.7133051753044128, + "num_tokens": 253344304.0, + "step": 102010 + }, + { + "epoch": 0.9353626111671404, + "learning_rate": 1.2929311451361511e-05, + "loss": 0.9526, + "mean_token_accuracy": 0.7138311803340912, + "num_tokens": 253372145.0, + "step": 102020 + }, + { + "epoch": 0.9354542954066196, + "learning_rate": 1.2910974603465665e-05, + "loss": 0.9742, + "mean_token_accuracy": 0.7077650666236878, + "num_tokens": 253400686.0, + "step": 102030 + }, + { + "epoch": 0.9355459796460989, + "learning_rate": 1.2892637755569817e-05, + "loss": 0.9608, + "mean_token_accuracy": 0.7084186375141144, + "num_tokens": 253429197.0, + "step": 102040 + }, + { + "epoch": 0.9356376638855781, + "learning_rate": 1.2874300907673972e-05, + "loss": 0.9211, + "mean_token_accuracy": 0.7175590336322785, + "num_tokens": 253457161.0, + "step": 102050 + }, + { + "epoch": 0.9357293481250573, + "learning_rate": 1.2855964059778126e-05, + "loss": 0.9631, + "mean_token_accuracy": 0.7109842479228974, + "num_tokens": 253485237.0, + "step": 102060 + }, + { + "epoch": 0.9358210323645365, + "learning_rate": 1.2837627211882277e-05, + "loss": 0.9629, + "mean_token_accuracy": 0.7063953459262848, + "num_tokens": 253514390.0, + "step": 102070 + }, + { + "epoch": 0.9359127166040158, + "learning_rate": 1.2819290363986431e-05, + "loss": 0.9619, + "mean_token_accuracy": 0.7067668616771698, + "num_tokens": 253542531.0, + "step": 102080 + }, + { + "epoch": 0.936004400843495, + "learning_rate": 1.2800953516090586e-05, + "loss": 0.9593, + "mean_token_accuracy": 0.7030080020427704, + "num_tokens": 253569624.0, + "step": 102090 + }, + { + "epoch": 0.9360960850829743, + "learning_rate": 1.2782616668194738e-05, + "loss": 0.9374, + "mean_token_accuracy": 0.7127783238887787, + "num_tokens": 253596874.0, + "step": 102100 + }, + { + "epoch": 0.9361877693224535, + "learning_rate": 1.2764279820298892e-05, + "loss": 0.9839, + "mean_token_accuracy": 0.6990141153335572, + "num_tokens": 253624378.0, + "step": 102110 + }, + { + "epoch": 0.9362794535619327, + "learning_rate": 1.2745942972403044e-05, + "loss": 0.9601, + "mean_token_accuracy": 0.7078054070472717, + "num_tokens": 253651947.0, + "step": 102120 + }, + { + "epoch": 0.9363711378014119, + "learning_rate": 1.2727606124507197e-05, + "loss": 0.9349, + "mean_token_accuracy": 0.7184051156044007, + "num_tokens": 253680296.0, + "step": 102130 + }, + { + "epoch": 0.9364628220408912, + "learning_rate": 1.2709269276611352e-05, + "loss": 0.9666, + "mean_token_accuracy": 0.7019192457199097, + "num_tokens": 253708585.0, + "step": 102140 + }, + { + "epoch": 0.9365545062803704, + "learning_rate": 1.2690932428715504e-05, + "loss": 0.9409, + "mean_token_accuracy": 0.713731199502945, + "num_tokens": 253735826.0, + "step": 102150 + }, + { + "epoch": 0.9366461905198497, + "learning_rate": 1.2672595580819658e-05, + "loss": 0.9334, + "mean_token_accuracy": 0.7147872805595398, + "num_tokens": 253762513.0, + "step": 102160 + }, + { + "epoch": 0.9367378747593289, + "learning_rate": 1.265425873292381e-05, + "loss": 0.9461, + "mean_token_accuracy": 0.7095882177352906, + "num_tokens": 253790226.0, + "step": 102170 + }, + { + "epoch": 0.9368295589988082, + "learning_rate": 1.2635921885027965e-05, + "loss": 0.9557, + "mean_token_accuracy": 0.7096666812896728, + "num_tokens": 253818231.0, + "step": 102180 + }, + { + "epoch": 0.9369212432382873, + "learning_rate": 1.2617585037132118e-05, + "loss": 0.9768, + "mean_token_accuracy": 0.706231164932251, + "num_tokens": 253846390.0, + "step": 102190 + }, + { + "epoch": 0.9370129274777665, + "learning_rate": 1.259924818923627e-05, + "loss": 0.9545, + "mean_token_accuracy": 0.7078743278980255, + "num_tokens": 253874150.0, + "step": 102200 + }, + { + "epoch": 0.9371046117172458, + "learning_rate": 1.2580911341340424e-05, + "loss": 0.9565, + "mean_token_accuracy": 0.7112432301044465, + "num_tokens": 253902431.0, + "step": 102210 + }, + { + "epoch": 0.937196295956725, + "learning_rate": 1.2562574493444579e-05, + "loss": 0.93, + "mean_token_accuracy": 0.7090595901012421, + "num_tokens": 253930473.0, + "step": 102220 + }, + { + "epoch": 0.9372879801962043, + "learning_rate": 1.2544237645548731e-05, + "loss": 0.9554, + "mean_token_accuracy": 0.7088334858417511, + "num_tokens": 253958093.0, + "step": 102230 + }, + { + "epoch": 0.9373796644356835, + "learning_rate": 1.2525900797652885e-05, + "loss": 0.9422, + "mean_token_accuracy": 0.7113230943679809, + "num_tokens": 253985350.0, + "step": 102240 + }, + { + "epoch": 0.9374713486751627, + "learning_rate": 1.2507563949757036e-05, + "loss": 0.9302, + "mean_token_accuracy": 0.7184086322784424, + "num_tokens": 254013143.0, + "step": 102250 + }, + { + "epoch": 0.9375630329146419, + "learning_rate": 1.2489227101861192e-05, + "loss": 0.9352, + "mean_token_accuracy": 0.7166255116462708, + "num_tokens": 254040989.0, + "step": 102260 + }, + { + "epoch": 0.9376547171541212, + "learning_rate": 1.2470890253965344e-05, + "loss": 0.9744, + "mean_token_accuracy": 0.7072222352027893, + "num_tokens": 254069361.0, + "step": 102270 + }, + { + "epoch": 0.9377464013936004, + "learning_rate": 1.2452553406069497e-05, + "loss": 0.9537, + "mean_token_accuracy": 0.7117165207862854, + "num_tokens": 254096868.0, + "step": 102280 + }, + { + "epoch": 0.9378380856330797, + "learning_rate": 1.243421655817365e-05, + "loss": 0.965, + "mean_token_accuracy": 0.7056435406208038, + "num_tokens": 254124369.0, + "step": 102290 + }, + { + "epoch": 0.9379297698725589, + "learning_rate": 1.2415879710277804e-05, + "loss": 0.9713, + "mean_token_accuracy": 0.7107076525688172, + "num_tokens": 254152127.0, + "step": 102300 + }, + { + "epoch": 0.9380214541120382, + "learning_rate": 1.2397542862381958e-05, + "loss": 0.9778, + "mean_token_accuracy": 0.7051454901695251, + "num_tokens": 254180863.0, + "step": 102310 + }, + { + "epoch": 0.9381131383515173, + "learning_rate": 1.2379206014486111e-05, + "loss": 0.9682, + "mean_token_accuracy": 0.7083398342132569, + "num_tokens": 254209016.0, + "step": 102320 + }, + { + "epoch": 0.9382048225909966, + "learning_rate": 1.2360869166590263e-05, + "loss": 0.9294, + "mean_token_accuracy": 0.7196935713291168, + "num_tokens": 254236176.0, + "step": 102330 + }, + { + "epoch": 0.9382965068304758, + "learning_rate": 1.2342532318694417e-05, + "loss": 0.9597, + "mean_token_accuracy": 0.7071610927581787, + "num_tokens": 254263966.0, + "step": 102340 + }, + { + "epoch": 0.9383881910699551, + "learning_rate": 1.232419547079857e-05, + "loss": 0.9621, + "mean_token_accuracy": 0.7054771661758423, + "num_tokens": 254291939.0, + "step": 102350 + }, + { + "epoch": 0.9384798753094343, + "learning_rate": 1.2305858622902724e-05, + "loss": 0.9584, + "mean_token_accuracy": 0.7100796222686767, + "num_tokens": 254319702.0, + "step": 102360 + }, + { + "epoch": 0.9385715595489136, + "learning_rate": 1.2287521775006877e-05, + "loss": 0.9913, + "mean_token_accuracy": 0.7060858964920044, + "num_tokens": 254347511.0, + "step": 102370 + }, + { + "epoch": 0.9386632437883927, + "learning_rate": 1.226918492711103e-05, + "loss": 0.9714, + "mean_token_accuracy": 0.7083201467990875, + "num_tokens": 254376053.0, + "step": 102380 + }, + { + "epoch": 0.938754928027872, + "learning_rate": 1.2250848079215185e-05, + "loss": 0.973, + "mean_token_accuracy": 0.7036384522914887, + "num_tokens": 254404048.0, + "step": 102390 + }, + { + "epoch": 0.9388466122673512, + "learning_rate": 1.2232511231319336e-05, + "loss": 0.9503, + "mean_token_accuracy": 0.7131141543388366, + "num_tokens": 254431605.0, + "step": 102400 + }, + { + "epoch": 0.9389382965068305, + "learning_rate": 1.221417438342349e-05, + "loss": 0.9388, + "mean_token_accuracy": 0.7128082752227783, + "num_tokens": 254459806.0, + "step": 102410 + }, + { + "epoch": 0.9390299807463097, + "learning_rate": 1.2195837535527644e-05, + "loss": 0.9712, + "mean_token_accuracy": 0.7045019030570984, + "num_tokens": 254487273.0, + "step": 102420 + }, + { + "epoch": 0.939121664985789, + "learning_rate": 1.2177500687631797e-05, + "loss": 0.9457, + "mean_token_accuracy": 0.7112976431846618, + "num_tokens": 254515332.0, + "step": 102430 + }, + { + "epoch": 0.9392133492252682, + "learning_rate": 1.215916383973595e-05, + "loss": 0.93, + "mean_token_accuracy": 0.7165105700492859, + "num_tokens": 254543712.0, + "step": 102440 + }, + { + "epoch": 0.9393050334647474, + "learning_rate": 1.2140826991840103e-05, + "loss": 0.9363, + "mean_token_accuracy": 0.7132966458797455, + "num_tokens": 254572780.0, + "step": 102450 + }, + { + "epoch": 0.9393967177042266, + "learning_rate": 1.2122490143944256e-05, + "loss": 0.9426, + "mean_token_accuracy": 0.7113722503185272, + "num_tokens": 254600234.0, + "step": 102460 + }, + { + "epoch": 0.9394884019437059, + "learning_rate": 1.210415329604841e-05, + "loss": 0.9723, + "mean_token_accuracy": 0.706432455778122, + "num_tokens": 254628822.0, + "step": 102470 + }, + { + "epoch": 0.9395800861831851, + "learning_rate": 1.2085816448152563e-05, + "loss": 0.9545, + "mean_token_accuracy": 0.7113306283950805, + "num_tokens": 254657481.0, + "step": 102480 + }, + { + "epoch": 0.9396717704226644, + "learning_rate": 1.2067479600256717e-05, + "loss": 0.9716, + "mean_token_accuracy": 0.7082769691944122, + "num_tokens": 254684772.0, + "step": 102490 + }, + { + "epoch": 0.9397634546621436, + "learning_rate": 1.204914275236087e-05, + "loss": 0.9264, + "mean_token_accuracy": 0.718409514427185, + "num_tokens": 254711876.0, + "step": 102500 + }, + { + "epoch": 0.9398551389016229, + "learning_rate": 1.2030805904465022e-05, + "loss": 0.9726, + "mean_token_accuracy": 0.6997957825660706, + "num_tokens": 254740231.0, + "step": 102510 + }, + { + "epoch": 0.939946823141102, + "learning_rate": 1.2012469056569178e-05, + "loss": 0.9299, + "mean_token_accuracy": 0.7119948267936707, + "num_tokens": 254768375.0, + "step": 102520 + }, + { + "epoch": 0.9400385073805813, + "learning_rate": 1.199413220867333e-05, + "loss": 0.9598, + "mean_token_accuracy": 0.708594286441803, + "num_tokens": 254795435.0, + "step": 102530 + }, + { + "epoch": 0.9401301916200605, + "learning_rate": 1.1975795360777483e-05, + "loss": 0.9742, + "mean_token_accuracy": 0.7056930780410766, + "num_tokens": 254823645.0, + "step": 102540 + }, + { + "epoch": 0.9402218758595398, + "learning_rate": 1.1957458512881636e-05, + "loss": 0.9364, + "mean_token_accuracy": 0.7146631479263306, + "num_tokens": 254850616.0, + "step": 102550 + }, + { + "epoch": 0.940313560099019, + "learning_rate": 1.1939121664985788e-05, + "loss": 0.9171, + "mean_token_accuracy": 0.7172474384307861, + "num_tokens": 254878318.0, + "step": 102560 + }, + { + "epoch": 0.9404052443384983, + "learning_rate": 1.1920784817089944e-05, + "loss": 0.9188, + "mean_token_accuracy": 0.7150501072406769, + "num_tokens": 254906065.0, + "step": 102570 + }, + { + "epoch": 0.9404969285779774, + "learning_rate": 1.1902447969194095e-05, + "loss": 0.9454, + "mean_token_accuracy": 0.7106794238090515, + "num_tokens": 254933663.0, + "step": 102580 + }, + { + "epoch": 0.9405886128174566, + "learning_rate": 1.1884111121298249e-05, + "loss": 0.9727, + "mean_token_accuracy": 0.7085217356681823, + "num_tokens": 254961576.0, + "step": 102590 + }, + { + "epoch": 0.9406802970569359, + "learning_rate": 1.1865774273402403e-05, + "loss": 0.9957, + "mean_token_accuracy": 0.7010318994522095, + "num_tokens": 254989926.0, + "step": 102600 + }, + { + "epoch": 0.9407719812964151, + "learning_rate": 1.1847437425506556e-05, + "loss": 0.9675, + "mean_token_accuracy": 0.7058118462562561, + "num_tokens": 255018011.0, + "step": 102610 + }, + { + "epoch": 0.9408636655358944, + "learning_rate": 1.182910057761071e-05, + "loss": 0.9388, + "mean_token_accuracy": 0.7153486907482147, + "num_tokens": 255046107.0, + "step": 102620 + }, + { + "epoch": 0.9409553497753737, + "learning_rate": 1.1810763729714863e-05, + "loss": 0.9451, + "mean_token_accuracy": 0.708610600233078, + "num_tokens": 255074703.0, + "step": 102630 + }, + { + "epoch": 0.9410470340148529, + "learning_rate": 1.1792426881819015e-05, + "loss": 0.9487, + "mean_token_accuracy": 0.7160908460617066, + "num_tokens": 255102673.0, + "step": 102640 + }, + { + "epoch": 0.941138718254332, + "learning_rate": 1.1774090033923169e-05, + "loss": 0.9296, + "mean_token_accuracy": 0.7148681581020355, + "num_tokens": 255130748.0, + "step": 102650 + }, + { + "epoch": 0.9412304024938113, + "learning_rate": 1.1755753186027322e-05, + "loss": 0.9211, + "mean_token_accuracy": 0.7172384858131409, + "num_tokens": 255159178.0, + "step": 102660 + }, + { + "epoch": 0.9413220867332905, + "learning_rate": 1.1737416338131476e-05, + "loss": 0.9517, + "mean_token_accuracy": 0.7140165328979492, + "num_tokens": 255186210.0, + "step": 102670 + }, + { + "epoch": 0.9414137709727698, + "learning_rate": 1.171907949023563e-05, + "loss": 0.9305, + "mean_token_accuracy": 0.7180571615695953, + "num_tokens": 255213123.0, + "step": 102680 + }, + { + "epoch": 0.941505455212249, + "learning_rate": 1.1700742642339781e-05, + "loss": 0.954, + "mean_token_accuracy": 0.7052584767341614, + "num_tokens": 255241689.0, + "step": 102690 + }, + { + "epoch": 0.9415971394517283, + "learning_rate": 1.1682405794443937e-05, + "loss": 0.9402, + "mean_token_accuracy": 0.7112890183925629, + "num_tokens": 255270439.0, + "step": 102700 + }, + { + "epoch": 0.9416888236912074, + "learning_rate": 1.1664068946548088e-05, + "loss": 0.9901, + "mean_token_accuracy": 0.7062026262283325, + "num_tokens": 255298352.0, + "step": 102710 + }, + { + "epoch": 0.9417805079306867, + "learning_rate": 1.1645732098652242e-05, + "loss": 0.9602, + "mean_token_accuracy": 0.7041107833385467, + "num_tokens": 255327198.0, + "step": 102720 + }, + { + "epoch": 0.9418721921701659, + "learning_rate": 1.1627395250756396e-05, + "loss": 0.9666, + "mean_token_accuracy": 0.7073990762233734, + "num_tokens": 255355082.0, + "step": 102730 + }, + { + "epoch": 0.9419638764096452, + "learning_rate": 1.1609058402860549e-05, + "loss": 0.9532, + "mean_token_accuracy": 0.7126502692699432, + "num_tokens": 255382685.0, + "step": 102740 + }, + { + "epoch": 0.9420555606491244, + "learning_rate": 1.1590721554964703e-05, + "loss": 0.9282, + "mean_token_accuracy": 0.7141442239284516, + "num_tokens": 255409901.0, + "step": 102750 + }, + { + "epoch": 0.9421472448886037, + "learning_rate": 1.1572384707068855e-05, + "loss": 0.972, + "mean_token_accuracy": 0.70137899518013, + "num_tokens": 255438524.0, + "step": 102760 + }, + { + "epoch": 0.9422389291280829, + "learning_rate": 1.1554047859173008e-05, + "loss": 0.9561, + "mean_token_accuracy": 0.710118705034256, + "num_tokens": 255467764.0, + "step": 102770 + }, + { + "epoch": 0.9423306133675621, + "learning_rate": 1.1535711011277162e-05, + "loss": 0.9489, + "mean_token_accuracy": 0.7068646609783172, + "num_tokens": 255496428.0, + "step": 102780 + }, + { + "epoch": 0.9424222976070413, + "learning_rate": 1.1517374163381315e-05, + "loss": 0.9485, + "mean_token_accuracy": 0.7078204989433289, + "num_tokens": 255524565.0, + "step": 102790 + }, + { + "epoch": 0.9425139818465206, + "learning_rate": 1.1499037315485469e-05, + "loss": 0.954, + "mean_token_accuracy": 0.7103520512580872, + "num_tokens": 255551758.0, + "step": 102800 + }, + { + "epoch": 0.9426056660859998, + "learning_rate": 1.1480700467589622e-05, + "loss": 0.9442, + "mean_token_accuracy": 0.7119756937026978, + "num_tokens": 255579314.0, + "step": 102810 + }, + { + "epoch": 0.9426973503254791, + "learning_rate": 1.1462363619693774e-05, + "loss": 0.9523, + "mean_token_accuracy": 0.7119636416435242, + "num_tokens": 255607939.0, + "step": 102820 + }, + { + "epoch": 0.9427890345649583, + "learning_rate": 1.144402677179793e-05, + "loss": 0.9103, + "mean_token_accuracy": 0.7157583832740784, + "num_tokens": 255636202.0, + "step": 102830 + }, + { + "epoch": 0.9428807188044375, + "learning_rate": 1.1425689923902081e-05, + "loss": 0.9288, + "mean_token_accuracy": 0.7167107999324799, + "num_tokens": 255662473.0, + "step": 102840 + }, + { + "epoch": 0.9429724030439167, + "learning_rate": 1.1407353076006235e-05, + "loss": 0.9504, + "mean_token_accuracy": 0.713322114944458, + "num_tokens": 255691494.0, + "step": 102850 + }, + { + "epoch": 0.943064087283396, + "learning_rate": 1.1389016228110388e-05, + "loss": 0.9028, + "mean_token_accuracy": 0.7244246780872345, + "num_tokens": 255718669.0, + "step": 102860 + }, + { + "epoch": 0.9431557715228752, + "learning_rate": 1.1370679380214542e-05, + "loss": 0.944, + "mean_token_accuracy": 0.7100665211677551, + "num_tokens": 255746572.0, + "step": 102870 + }, + { + "epoch": 0.9432474557623545, + "learning_rate": 1.1352342532318696e-05, + "loss": 0.9769, + "mean_token_accuracy": 0.7085854828357696, + "num_tokens": 255773817.0, + "step": 102880 + }, + { + "epoch": 0.9433391400018337, + "learning_rate": 1.1334005684422847e-05, + "loss": 0.9391, + "mean_token_accuracy": 0.7132640063762665, + "num_tokens": 255801392.0, + "step": 102890 + }, + { + "epoch": 0.943430824241313, + "learning_rate": 1.1315668836527003e-05, + "loss": 0.9796, + "mean_token_accuracy": 0.7016677379608154, + "num_tokens": 255829170.0, + "step": 102900 + }, + { + "epoch": 0.9435225084807921, + "learning_rate": 1.1297331988631155e-05, + "loss": 0.9782, + "mean_token_accuracy": 0.7059294164180756, + "num_tokens": 255856735.0, + "step": 102910 + }, + { + "epoch": 0.9436141927202714, + "learning_rate": 1.1278995140735308e-05, + "loss": 0.9449, + "mean_token_accuracy": 0.7062544524669647, + "num_tokens": 255885068.0, + "step": 102920 + }, + { + "epoch": 0.9437058769597506, + "learning_rate": 1.1260658292839462e-05, + "loss": 0.9609, + "mean_token_accuracy": 0.7042105615139007, + "num_tokens": 255913407.0, + "step": 102930 + }, + { + "epoch": 0.9437975611992299, + "learning_rate": 1.1242321444943615e-05, + "loss": 0.9595, + "mean_token_accuracy": 0.706026577949524, + "num_tokens": 255940903.0, + "step": 102940 + }, + { + "epoch": 0.9438892454387091, + "learning_rate": 1.1223984597047769e-05, + "loss": 0.919, + "mean_token_accuracy": 0.7188919186592102, + "num_tokens": 255969553.0, + "step": 102950 + }, + { + "epoch": 0.9439809296781884, + "learning_rate": 1.120564774915192e-05, + "loss": 0.953, + "mean_token_accuracy": 0.7064568102359772, + "num_tokens": 255996700.0, + "step": 102960 + }, + { + "epoch": 0.9440726139176675, + "learning_rate": 1.1187310901256074e-05, + "loss": 0.9773, + "mean_token_accuracy": 0.7042794942855835, + "num_tokens": 256026068.0, + "step": 102970 + }, + { + "epoch": 0.9441642981571468, + "learning_rate": 1.1168974053360228e-05, + "loss": 0.9851, + "mean_token_accuracy": 0.7081849694252014, + "num_tokens": 256054448.0, + "step": 102980 + }, + { + "epoch": 0.944255982396626, + "learning_rate": 1.1150637205464381e-05, + "loss": 0.9317, + "mean_token_accuracy": 0.7123378932476043, + "num_tokens": 256082585.0, + "step": 102990 + }, + { + "epoch": 0.9443476666361053, + "learning_rate": 1.1132300357568535e-05, + "loss": 0.9662, + "mean_token_accuracy": 0.7105158627033233, + "num_tokens": 256110622.0, + "step": 103000 + }, + { + "epoch": 0.9444393508755845, + "learning_rate": 1.1113963509672688e-05, + "loss": 0.9478, + "mean_token_accuracy": 0.707587081193924, + "num_tokens": 256139438.0, + "step": 103010 + }, + { + "epoch": 0.9445310351150638, + "learning_rate": 1.109562666177684e-05, + "loss": 0.9507, + "mean_token_accuracy": 0.7156376719474793, + "num_tokens": 256166230.0, + "step": 103020 + }, + { + "epoch": 0.944622719354543, + "learning_rate": 1.1077289813880996e-05, + "loss": 0.9391, + "mean_token_accuracy": 0.7084162771701813, + "num_tokens": 256195537.0, + "step": 103030 + }, + { + "epoch": 0.9447144035940221, + "learning_rate": 1.1058952965985147e-05, + "loss": 0.9257, + "mean_token_accuracy": 0.7145484566688538, + "num_tokens": 256223271.0, + "step": 103040 + }, + { + "epoch": 0.9448060878335014, + "learning_rate": 1.1040616118089301e-05, + "loss": 0.9578, + "mean_token_accuracy": 0.708631718158722, + "num_tokens": 256250945.0, + "step": 103050 + }, + { + "epoch": 0.9448977720729806, + "learning_rate": 1.1022279270193455e-05, + "loss": 0.9471, + "mean_token_accuracy": 0.7148377418518066, + "num_tokens": 256278424.0, + "step": 103060 + }, + { + "epoch": 0.9449894563124599, + "learning_rate": 1.1003942422297606e-05, + "loss": 0.948, + "mean_token_accuracy": 0.712054181098938, + "num_tokens": 256306208.0, + "step": 103070 + }, + { + "epoch": 0.9450811405519391, + "learning_rate": 1.0985605574401762e-05, + "loss": 0.9452, + "mean_token_accuracy": 0.7049896419048309, + "num_tokens": 256334342.0, + "step": 103080 + }, + { + "epoch": 0.9451728247914184, + "learning_rate": 1.0967268726505914e-05, + "loss": 0.9564, + "mean_token_accuracy": 0.7121441900730133, + "num_tokens": 256362039.0, + "step": 103090 + }, + { + "epoch": 0.9452645090308975, + "learning_rate": 1.0948931878610067e-05, + "loss": 0.9535, + "mean_token_accuracy": 0.7116735219955445, + "num_tokens": 256390405.0, + "step": 103100 + }, + { + "epoch": 0.9453561932703768, + "learning_rate": 1.093059503071422e-05, + "loss": 0.9444, + "mean_token_accuracy": 0.7108181834220886, + "num_tokens": 256417494.0, + "step": 103110 + }, + { + "epoch": 0.945447877509856, + "learning_rate": 1.0912258182818374e-05, + "loss": 0.9486, + "mean_token_accuracy": 0.714609807729721, + "num_tokens": 256445639.0, + "step": 103120 + }, + { + "epoch": 0.9455395617493353, + "learning_rate": 1.0893921334922528e-05, + "loss": 0.9675, + "mean_token_accuracy": 0.7062018990516663, + "num_tokens": 256474701.0, + "step": 103130 + }, + { + "epoch": 0.9456312459888145, + "learning_rate": 1.0875584487026681e-05, + "loss": 0.9765, + "mean_token_accuracy": 0.7075938940048218, + "num_tokens": 256502867.0, + "step": 103140 + }, + { + "epoch": 0.9457229302282938, + "learning_rate": 1.0857247639130833e-05, + "loss": 0.9737, + "mean_token_accuracy": 0.7039482593536377, + "num_tokens": 256530942.0, + "step": 103150 + }, + { + "epoch": 0.945814614467773, + "learning_rate": 1.0838910791234987e-05, + "loss": 0.9747, + "mean_token_accuracy": 0.7098252058029175, + "num_tokens": 256559324.0, + "step": 103160 + }, + { + "epoch": 0.9459062987072522, + "learning_rate": 1.082057394333914e-05, + "loss": 0.9916, + "mean_token_accuracy": 0.6999709665775299, + "num_tokens": 256587536.0, + "step": 103170 + }, + { + "epoch": 0.9459979829467314, + "learning_rate": 1.0802237095443294e-05, + "loss": 0.9436, + "mean_token_accuracy": 0.7075395107269287, + "num_tokens": 256615740.0, + "step": 103180 + }, + { + "epoch": 0.9460896671862107, + "learning_rate": 1.0783900247547447e-05, + "loss": 0.9468, + "mean_token_accuracy": 0.7163018643856048, + "num_tokens": 256643101.0, + "step": 103190 + }, + { + "epoch": 0.9461813514256899, + "learning_rate": 1.07655633996516e-05, + "loss": 0.9785, + "mean_token_accuracy": 0.7065538823604584, + "num_tokens": 256671159.0, + "step": 103200 + }, + { + "epoch": 0.9462730356651692, + "learning_rate": 1.0747226551755755e-05, + "loss": 0.9701, + "mean_token_accuracy": 0.7056053638458252, + "num_tokens": 256698939.0, + "step": 103210 + }, + { + "epoch": 0.9463647199046484, + "learning_rate": 1.0728889703859906e-05, + "loss": 0.9811, + "mean_token_accuracy": 0.7037706851959229, + "num_tokens": 256727759.0, + "step": 103220 + }, + { + "epoch": 0.9464564041441276, + "learning_rate": 1.071055285596406e-05, + "loss": 0.9543, + "mean_token_accuracy": 0.7111855804920196, + "num_tokens": 256754783.0, + "step": 103230 + }, + { + "epoch": 0.9465480883836068, + "learning_rate": 1.0692216008068214e-05, + "loss": 0.9585, + "mean_token_accuracy": 0.7117890298366547, + "num_tokens": 256782722.0, + "step": 103240 + }, + { + "epoch": 0.9466397726230861, + "learning_rate": 1.0673879160172367e-05, + "loss": 0.9238, + "mean_token_accuracy": 0.7099150657653809, + "num_tokens": 256810530.0, + "step": 103250 + }, + { + "epoch": 0.9467314568625653, + "learning_rate": 1.065554231227652e-05, + "loss": 0.9325, + "mean_token_accuracy": 0.7152824342250824, + "num_tokens": 256838939.0, + "step": 103260 + }, + { + "epoch": 0.9468231411020446, + "learning_rate": 1.0637205464380673e-05, + "loss": 0.9652, + "mean_token_accuracy": 0.7128736257553101, + "num_tokens": 256866720.0, + "step": 103270 + }, + { + "epoch": 0.9469148253415238, + "learning_rate": 1.0618868616484826e-05, + "loss": 0.9292, + "mean_token_accuracy": 0.7194776773452759, + "num_tokens": 256894357.0, + "step": 103280 + }, + { + "epoch": 0.9470065095810031, + "learning_rate": 1.060053176858898e-05, + "loss": 0.9609, + "mean_token_accuracy": 0.7091909885406494, + "num_tokens": 256921804.0, + "step": 103290 + }, + { + "epoch": 0.9470981938204822, + "learning_rate": 1.0582194920693133e-05, + "loss": 0.9423, + "mean_token_accuracy": 0.7118369340896606, + "num_tokens": 256949732.0, + "step": 103300 + }, + { + "epoch": 0.9471898780599615, + "learning_rate": 1.0563858072797287e-05, + "loss": 0.9768, + "mean_token_accuracy": 0.7053621292114258, + "num_tokens": 256977435.0, + "step": 103310 + }, + { + "epoch": 0.9472815622994407, + "learning_rate": 1.054552122490144e-05, + "loss": 0.9483, + "mean_token_accuracy": 0.7116852819919586, + "num_tokens": 257004798.0, + "step": 103320 + }, + { + "epoch": 0.94737324653892, + "learning_rate": 1.0527184377005592e-05, + "loss": 0.9697, + "mean_token_accuracy": 0.7076071083545685, + "num_tokens": 257032795.0, + "step": 103330 + }, + { + "epoch": 0.9474649307783992, + "learning_rate": 1.0508847529109748e-05, + "loss": 0.9503, + "mean_token_accuracy": 0.7118573665618897, + "num_tokens": 257060989.0, + "step": 103340 + }, + { + "epoch": 0.9475566150178785, + "learning_rate": 1.04905106812139e-05, + "loss": 0.965, + "mean_token_accuracy": 0.7086583495140075, + "num_tokens": 257089396.0, + "step": 103350 + }, + { + "epoch": 0.9476482992573576, + "learning_rate": 1.0472173833318053e-05, + "loss": 0.9412, + "mean_token_accuracy": 0.7133853733539581, + "num_tokens": 257117707.0, + "step": 103360 + }, + { + "epoch": 0.9477399834968369, + "learning_rate": 1.0453836985422207e-05, + "loss": 0.9491, + "mean_token_accuracy": 0.7088606655597687, + "num_tokens": 257145689.0, + "step": 103370 + }, + { + "epoch": 0.9478316677363161, + "learning_rate": 1.0435500137526358e-05, + "loss": 0.9344, + "mean_token_accuracy": 0.7158215522766114, + "num_tokens": 257174306.0, + "step": 103380 + }, + { + "epoch": 0.9479233519757954, + "learning_rate": 1.0417163289630514e-05, + "loss": 0.9179, + "mean_token_accuracy": 0.7221521854400634, + "num_tokens": 257202398.0, + "step": 103390 + }, + { + "epoch": 0.9480150362152746, + "learning_rate": 1.0398826441734666e-05, + "loss": 0.9549, + "mean_token_accuracy": 0.7112609088420868, + "num_tokens": 257230126.0, + "step": 103400 + }, + { + "epoch": 0.9481067204547539, + "learning_rate": 1.038048959383882e-05, + "loss": 0.9357, + "mean_token_accuracy": 0.7162086427211761, + "num_tokens": 257257389.0, + "step": 103410 + }, + { + "epoch": 0.9481984046942331, + "learning_rate": 1.0362152745942973e-05, + "loss": 0.9562, + "mean_token_accuracy": 0.7039444208145141, + "num_tokens": 257284823.0, + "step": 103420 + }, + { + "epoch": 0.9482900889337122, + "learning_rate": 1.0343815898047126e-05, + "loss": 0.9677, + "mean_token_accuracy": 0.7077718138694763, + "num_tokens": 257312928.0, + "step": 103430 + }, + { + "epoch": 0.9483817731731915, + "learning_rate": 1.032547905015128e-05, + "loss": 0.943, + "mean_token_accuracy": 0.7146332323551178, + "num_tokens": 257340869.0, + "step": 103440 + }, + { + "epoch": 0.9484734574126708, + "learning_rate": 1.0307142202255433e-05, + "loss": 0.9522, + "mean_token_accuracy": 0.7099611103534699, + "num_tokens": 257369527.0, + "step": 103450 + }, + { + "epoch": 0.94856514165215, + "learning_rate": 1.0288805354359587e-05, + "loss": 0.9468, + "mean_token_accuracy": 0.7089724659919738, + "num_tokens": 257397140.0, + "step": 103460 + }, + { + "epoch": 0.9486568258916293, + "learning_rate": 1.0270468506463739e-05, + "loss": 0.9767, + "mean_token_accuracy": 0.7073847889900208, + "num_tokens": 257425107.0, + "step": 103470 + }, + { + "epoch": 0.9487485101311085, + "learning_rate": 1.0252131658567892e-05, + "loss": 0.9364, + "mean_token_accuracy": 0.712783819437027, + "num_tokens": 257453099.0, + "step": 103480 + }, + { + "epoch": 0.9488401943705876, + "learning_rate": 1.0233794810672046e-05, + "loss": 0.9565, + "mean_token_accuracy": 0.7080893158912659, + "num_tokens": 257480863.0, + "step": 103490 + }, + { + "epoch": 0.9489318786100669, + "learning_rate": 1.02154579627762e-05, + "loss": 0.945, + "mean_token_accuracy": 0.7114560902118683, + "num_tokens": 257509350.0, + "step": 103500 + }, + { + "epoch": 0.9490235628495461, + "learning_rate": 1.0197121114880353e-05, + "loss": 0.9153, + "mean_token_accuracy": 0.7201562821865082, + "num_tokens": 257538072.0, + "step": 103510 + }, + { + "epoch": 0.9491152470890254, + "learning_rate": 1.0178784266984507e-05, + "loss": 0.9306, + "mean_token_accuracy": 0.7134028077125549, + "num_tokens": 257566075.0, + "step": 103520 + }, + { + "epoch": 0.9492069313285046, + "learning_rate": 1.0160447419088658e-05, + "loss": 0.9646, + "mean_token_accuracy": 0.711558175086975, + "num_tokens": 257593780.0, + "step": 103530 + }, + { + "epoch": 0.9492986155679839, + "learning_rate": 1.0142110571192814e-05, + "loss": 0.9591, + "mean_token_accuracy": 0.711041659116745, + "num_tokens": 257621778.0, + "step": 103540 + }, + { + "epoch": 0.9493902998074631, + "learning_rate": 1.0123773723296966e-05, + "loss": 0.9593, + "mean_token_accuracy": 0.7107082903385162, + "num_tokens": 257649639.0, + "step": 103550 + }, + { + "epoch": 0.9494819840469423, + "learning_rate": 1.0105436875401119e-05, + "loss": 0.9894, + "mean_token_accuracy": 0.7032026469707489, + "num_tokens": 257677953.0, + "step": 103560 + }, + { + "epoch": 0.9495736682864215, + "learning_rate": 1.0087100027505273e-05, + "loss": 0.9577, + "mean_token_accuracy": 0.7094796299934387, + "num_tokens": 257706411.0, + "step": 103570 + }, + { + "epoch": 0.9496653525259008, + "learning_rate": 1.0068763179609425e-05, + "loss": 0.9493, + "mean_token_accuracy": 0.7116182744503021, + "num_tokens": 257735209.0, + "step": 103580 + }, + { + "epoch": 0.94975703676538, + "learning_rate": 1.005042633171358e-05, + "loss": 0.9616, + "mean_token_accuracy": 0.7038978099822998, + "num_tokens": 257763694.0, + "step": 103590 + }, + { + "epoch": 0.9498487210048593, + "learning_rate": 1.0032089483817732e-05, + "loss": 0.943, + "mean_token_accuracy": 0.7120588600635529, + "num_tokens": 257791616.0, + "step": 103600 + }, + { + "epoch": 0.9499404052443385, + "learning_rate": 1.0013752635921885e-05, + "loss": 0.9589, + "mean_token_accuracy": 0.7063844621181488, + "num_tokens": 257819375.0, + "step": 103610 + }, + { + "epoch": 0.9500320894838177, + "learning_rate": 9.995415788026039e-06, + "loss": 0.929, + "mean_token_accuracy": 0.7149990439414978, + "num_tokens": 257846476.0, + "step": 103620 + }, + { + "epoch": 0.9501237737232969, + "learning_rate": 9.977078940130192e-06, + "loss": 0.9526, + "mean_token_accuracy": 0.7108969807624816, + "num_tokens": 257874735.0, + "step": 103630 + }, + { + "epoch": 0.9502154579627762, + "learning_rate": 9.958742092234346e-06, + "loss": 0.9784, + "mean_token_accuracy": 0.7079266607761383, + "num_tokens": 257902304.0, + "step": 103640 + }, + { + "epoch": 0.9503071422022554, + "learning_rate": 9.9404052443385e-06, + "loss": 0.9779, + "mean_token_accuracy": 0.7078679800033569, + "num_tokens": 257931179.0, + "step": 103650 + }, + { + "epoch": 0.9503988264417347, + "learning_rate": 9.922068396442651e-06, + "loss": 0.962, + "mean_token_accuracy": 0.7135915398597718, + "num_tokens": 257959103.0, + "step": 103660 + }, + { + "epoch": 0.9504905106812139, + "learning_rate": 9.903731548546805e-06, + "loss": 0.9377, + "mean_token_accuracy": 0.7142771303653717, + "num_tokens": 257986710.0, + "step": 103670 + }, + { + "epoch": 0.9505821949206932, + "learning_rate": 9.885394700650958e-06, + "loss": 0.9879, + "mean_token_accuracy": 0.7014545917510986, + "num_tokens": 258014745.0, + "step": 103680 + }, + { + "epoch": 0.9506738791601723, + "learning_rate": 9.867057852755112e-06, + "loss": 0.9633, + "mean_token_accuracy": 0.7079756379127502, + "num_tokens": 258042307.0, + "step": 103690 + }, + { + "epoch": 0.9507655633996516, + "learning_rate": 9.848721004859266e-06, + "loss": 0.9506, + "mean_token_accuracy": 0.7097310304641724, + "num_tokens": 258071402.0, + "step": 103700 + }, + { + "epoch": 0.9508572476391308, + "learning_rate": 9.830384156963417e-06, + "loss": 0.9473, + "mean_token_accuracy": 0.7122018277645111, + "num_tokens": 258099658.0, + "step": 103710 + }, + { + "epoch": 0.9509489318786101, + "learning_rate": 9.812047309067573e-06, + "loss": 0.9514, + "mean_token_accuracy": 0.7135707855224609, + "num_tokens": 258127085.0, + "step": 103720 + }, + { + "epoch": 0.9510406161180893, + "learning_rate": 9.793710461171725e-06, + "loss": 0.9441, + "mean_token_accuracy": 0.7074814796447754, + "num_tokens": 258155995.0, + "step": 103730 + }, + { + "epoch": 0.9511323003575686, + "learning_rate": 9.775373613275878e-06, + "loss": 0.9696, + "mean_token_accuracy": 0.7047323524951935, + "num_tokens": 258183360.0, + "step": 103740 + }, + { + "epoch": 0.9512239845970478, + "learning_rate": 9.757036765380032e-06, + "loss": 0.9555, + "mean_token_accuracy": 0.7139915108680726, + "num_tokens": 258210942.0, + "step": 103750 + }, + { + "epoch": 0.951315668836527, + "learning_rate": 9.738699917484185e-06, + "loss": 0.9254, + "mean_token_accuracy": 0.717748486995697, + "num_tokens": 258239633.0, + "step": 103760 + }, + { + "epoch": 0.9514073530760062, + "learning_rate": 9.720363069588339e-06, + "loss": 0.9686, + "mean_token_accuracy": 0.7114035665988923, + "num_tokens": 258266974.0, + "step": 103770 + }, + { + "epoch": 0.9514990373154855, + "learning_rate": 9.70202622169249e-06, + "loss": 0.9671, + "mean_token_accuracy": 0.7076778531074523, + "num_tokens": 258294246.0, + "step": 103780 + }, + { + "epoch": 0.9515907215549647, + "learning_rate": 9.683689373796644e-06, + "loss": 0.9433, + "mean_token_accuracy": 0.7101082801818848, + "num_tokens": 258323185.0, + "step": 103790 + }, + { + "epoch": 0.951682405794444, + "learning_rate": 9.665352525900798e-06, + "loss": 0.9746, + "mean_token_accuracy": 0.7070024132728576, + "num_tokens": 258351205.0, + "step": 103800 + }, + { + "epoch": 0.9517740900339232, + "learning_rate": 9.647015678004951e-06, + "loss": 0.9463, + "mean_token_accuracy": 0.715484869480133, + "num_tokens": 258378655.0, + "step": 103810 + }, + { + "epoch": 0.9518657742734024, + "learning_rate": 9.628678830109105e-06, + "loss": 0.9428, + "mean_token_accuracy": 0.7091742873191833, + "num_tokens": 258406924.0, + "step": 103820 + }, + { + "epoch": 0.9519574585128816, + "learning_rate": 9.610341982213258e-06, + "loss": 0.9439, + "mean_token_accuracy": 0.7174428999423981, + "num_tokens": 258434029.0, + "step": 103830 + }, + { + "epoch": 0.9520491427523609, + "learning_rate": 9.59200513431741e-06, + "loss": 0.9685, + "mean_token_accuracy": 0.7059837639331817, + "num_tokens": 258461863.0, + "step": 103840 + }, + { + "epoch": 0.9521408269918401, + "learning_rate": 9.573668286421566e-06, + "loss": 0.9689, + "mean_token_accuracy": 0.7063271284103394, + "num_tokens": 258490273.0, + "step": 103850 + }, + { + "epoch": 0.9522325112313194, + "learning_rate": 9.555331438525717e-06, + "loss": 0.9458, + "mean_token_accuracy": 0.7109232485294342, + "num_tokens": 258517609.0, + "step": 103860 + }, + { + "epoch": 0.9523241954707986, + "learning_rate": 9.536994590629871e-06, + "loss": 0.9717, + "mean_token_accuracy": 0.7070327520370483, + "num_tokens": 258545184.0, + "step": 103870 + }, + { + "epoch": 0.9524158797102779, + "learning_rate": 9.518657742734025e-06, + "loss": 0.9157, + "mean_token_accuracy": 0.7196493923664093, + "num_tokens": 258572310.0, + "step": 103880 + }, + { + "epoch": 0.952507563949757, + "learning_rate": 9.500320894838176e-06, + "loss": 0.9544, + "mean_token_accuracy": 0.7129814445972442, + "num_tokens": 258601242.0, + "step": 103890 + }, + { + "epoch": 0.9525992481892362, + "learning_rate": 9.481984046942332e-06, + "loss": 0.9386, + "mean_token_accuracy": 0.7104416191577911, + "num_tokens": 258628772.0, + "step": 103900 + }, + { + "epoch": 0.9526909324287155, + "learning_rate": 9.463647199046484e-06, + "loss": 0.9517, + "mean_token_accuracy": 0.7113486289978027, + "num_tokens": 258656102.0, + "step": 103910 + }, + { + "epoch": 0.9527826166681947, + "learning_rate": 9.445310351150637e-06, + "loss": 0.9578, + "mean_token_accuracy": 0.7102086842060089, + "num_tokens": 258683737.0, + "step": 103920 + }, + { + "epoch": 0.952874300907674, + "learning_rate": 9.42697350325479e-06, + "loss": 0.9755, + "mean_token_accuracy": 0.7076316356658936, + "num_tokens": 258712208.0, + "step": 103930 + }, + { + "epoch": 0.9529659851471532, + "learning_rate": 9.408636655358944e-06, + "loss": 0.941, + "mean_token_accuracy": 0.7127200841903687, + "num_tokens": 258740392.0, + "step": 103940 + }, + { + "epoch": 0.9530576693866324, + "learning_rate": 9.390299807463098e-06, + "loss": 0.9295, + "mean_token_accuracy": 0.7164123833179474, + "num_tokens": 258768852.0, + "step": 103950 + }, + { + "epoch": 0.9531493536261116, + "learning_rate": 9.371962959567251e-06, + "loss": 0.9206, + "mean_token_accuracy": 0.7147091567516327, + "num_tokens": 258796594.0, + "step": 103960 + }, + { + "epoch": 0.9532410378655909, + "learning_rate": 9.353626111671405e-06, + "loss": 0.9584, + "mean_token_accuracy": 0.7077657818794251, + "num_tokens": 258824947.0, + "step": 103970 + }, + { + "epoch": 0.9533327221050701, + "learning_rate": 9.335289263775557e-06, + "loss": 0.9542, + "mean_token_accuracy": 0.7099952220916748, + "num_tokens": 258852795.0, + "step": 103980 + }, + { + "epoch": 0.9534244063445494, + "learning_rate": 9.31695241587971e-06, + "loss": 0.9696, + "mean_token_accuracy": 0.7050184786319733, + "num_tokens": 258880797.0, + "step": 103990 + }, + { + "epoch": 0.9535160905840286, + "learning_rate": 9.298615567983864e-06, + "loss": 0.9578, + "mean_token_accuracy": 0.7135156214237213, + "num_tokens": 258907358.0, + "step": 104000 + }, + { + "epoch": 0.9536077748235079, + "learning_rate": 9.280278720088018e-06, + "loss": 0.9527, + "mean_token_accuracy": 0.7083232760429382, + "num_tokens": 258936386.0, + "step": 104010 + }, + { + "epoch": 0.953699459062987, + "learning_rate": 9.261941872192171e-06, + "loss": 0.9294, + "mean_token_accuracy": 0.7145907461643219, + "num_tokens": 258963604.0, + "step": 104020 + }, + { + "epoch": 0.9537911433024663, + "learning_rate": 9.243605024296325e-06, + "loss": 0.9783, + "mean_token_accuracy": 0.7060829818248748, + "num_tokens": 258990818.0, + "step": 104030 + }, + { + "epoch": 0.9538828275419455, + "learning_rate": 9.225268176400477e-06, + "loss": 0.9476, + "mean_token_accuracy": 0.7087313115596772, + "num_tokens": 259018300.0, + "step": 104040 + }, + { + "epoch": 0.9539745117814248, + "learning_rate": 9.206931328504632e-06, + "loss": 0.9471, + "mean_token_accuracy": 0.7067500948905945, + "num_tokens": 259046198.0, + "step": 104050 + }, + { + "epoch": 0.954066196020904, + "learning_rate": 9.188594480608784e-06, + "loss": 0.9529, + "mean_token_accuracy": 0.7083405673503875, + "num_tokens": 259074383.0, + "step": 104060 + }, + { + "epoch": 0.9541578802603833, + "learning_rate": 9.170257632712937e-06, + "loss": 0.9646, + "mean_token_accuracy": 0.7116964161396027, + "num_tokens": 259101842.0, + "step": 104070 + }, + { + "epoch": 0.9542495644998624, + "learning_rate": 9.15192078481709e-06, + "loss": 0.9598, + "mean_token_accuracy": 0.709268081188202, + "num_tokens": 259131262.0, + "step": 104080 + }, + { + "epoch": 0.9543412487393417, + "learning_rate": 9.133583936921243e-06, + "loss": 0.9474, + "mean_token_accuracy": 0.711880898475647, + "num_tokens": 259159972.0, + "step": 104090 + }, + { + "epoch": 0.9544329329788209, + "learning_rate": 9.115247089025398e-06, + "loss": 0.954, + "mean_token_accuracy": 0.7128210484981536, + "num_tokens": 259186961.0, + "step": 104100 + }, + { + "epoch": 0.9545246172183002, + "learning_rate": 9.09691024112955e-06, + "loss": 0.9587, + "mean_token_accuracy": 0.7122468411922455, + "num_tokens": 259215286.0, + "step": 104110 + }, + { + "epoch": 0.9546163014577794, + "learning_rate": 9.078573393233703e-06, + "loss": 0.9072, + "mean_token_accuracy": 0.7194814205169677, + "num_tokens": 259242399.0, + "step": 104120 + }, + { + "epoch": 0.9547079856972587, + "learning_rate": 9.060236545337857e-06, + "loss": 0.9426, + "mean_token_accuracy": 0.7142708241939545, + "num_tokens": 259269298.0, + "step": 104130 + }, + { + "epoch": 0.9547996699367379, + "learning_rate": 9.04189969744201e-06, + "loss": 0.9368, + "mean_token_accuracy": 0.7143619596958161, + "num_tokens": 259296549.0, + "step": 104140 + }, + { + "epoch": 0.9548913541762171, + "learning_rate": 9.023562849546164e-06, + "loss": 0.9814, + "mean_token_accuracy": 0.7055559635162354, + "num_tokens": 259325831.0, + "step": 104150 + }, + { + "epoch": 0.9549830384156963, + "learning_rate": 9.005226001650318e-06, + "loss": 0.9528, + "mean_token_accuracy": 0.7074734926223755, + "num_tokens": 259353912.0, + "step": 104160 + }, + { + "epoch": 0.9550747226551756, + "learning_rate": 8.98688915375447e-06, + "loss": 0.9498, + "mean_token_accuracy": 0.7051776826381684, + "num_tokens": 259382346.0, + "step": 104170 + }, + { + "epoch": 0.9551664068946548, + "learning_rate": 8.968552305858623e-06, + "loss": 0.9475, + "mean_token_accuracy": 0.7156764984130859, + "num_tokens": 259411168.0, + "step": 104180 + }, + { + "epoch": 0.9552580911341341, + "learning_rate": 8.950215457962777e-06, + "loss": 0.945, + "mean_token_accuracy": 0.7124345541000366, + "num_tokens": 259439682.0, + "step": 104190 + }, + { + "epoch": 0.9553497753736133, + "learning_rate": 8.93187861006693e-06, + "loss": 0.9625, + "mean_token_accuracy": 0.7090458929538727, + "num_tokens": 259467899.0, + "step": 104200 + }, + { + "epoch": 0.9554414596130925, + "learning_rate": 8.913541762171084e-06, + "loss": 0.9432, + "mean_token_accuracy": 0.7154362559318542, + "num_tokens": 259496247.0, + "step": 104210 + }, + { + "epoch": 0.9555331438525717, + "learning_rate": 8.895204914275236e-06, + "loss": 0.986, + "mean_token_accuracy": 0.7031678676605224, + "num_tokens": 259524253.0, + "step": 104220 + }, + { + "epoch": 0.955624828092051, + "learning_rate": 8.87686806637939e-06, + "loss": 0.9524, + "mean_token_accuracy": 0.7027429163455963, + "num_tokens": 259552243.0, + "step": 104230 + }, + { + "epoch": 0.9557165123315302, + "learning_rate": 8.858531218483543e-06, + "loss": 0.9664, + "mean_token_accuracy": 0.71009481549263, + "num_tokens": 259579815.0, + "step": 104240 + }, + { + "epoch": 0.9558081965710095, + "learning_rate": 8.840194370587696e-06, + "loss": 0.9498, + "mean_token_accuracy": 0.7081762790679932, + "num_tokens": 259607855.0, + "step": 104250 + }, + { + "epoch": 0.9558998808104887, + "learning_rate": 8.82185752269185e-06, + "loss": 0.9328, + "mean_token_accuracy": 0.7151672303676605, + "num_tokens": 259635978.0, + "step": 104260 + }, + { + "epoch": 0.955991565049968, + "learning_rate": 8.803520674796003e-06, + "loss": 0.9514, + "mean_token_accuracy": 0.7089860737323761, + "num_tokens": 259663824.0, + "step": 104270 + }, + { + "epoch": 0.9560832492894471, + "learning_rate": 8.785183826900157e-06, + "loss": 0.9286, + "mean_token_accuracy": 0.7175964951515198, + "num_tokens": 259691232.0, + "step": 104280 + }, + { + "epoch": 0.9561749335289264, + "learning_rate": 8.766846979004309e-06, + "loss": 0.97, + "mean_token_accuracy": 0.7069647789001465, + "num_tokens": 259719031.0, + "step": 104290 + }, + { + "epoch": 0.9562666177684056, + "learning_rate": 8.748510131108462e-06, + "loss": 0.9523, + "mean_token_accuracy": 0.7097716927528381, + "num_tokens": 259746249.0, + "step": 104300 + }, + { + "epoch": 0.9563583020078849, + "learning_rate": 8.730173283212616e-06, + "loss": 0.955, + "mean_token_accuracy": 0.7088623106479645, + "num_tokens": 259767504.0, + "step": 104310 + }, + { + "epoch": 0.9564499862473641, + "learning_rate": 8.71183643531677e-06, + "loss": 0.9427, + "mean_token_accuracy": 0.711846262216568, + "num_tokens": 259794682.0, + "step": 104320 + }, + { + "epoch": 0.9565416704868434, + "learning_rate": 8.693499587420923e-06, + "loss": 0.937, + "mean_token_accuracy": 0.7208527982234955, + "num_tokens": 259822354.0, + "step": 104330 + }, + { + "epoch": 0.9566333547263225, + "learning_rate": 8.675162739525077e-06, + "loss": 1.0061, + "mean_token_accuracy": 0.700165057182312, + "num_tokens": 259850180.0, + "step": 104340 + }, + { + "epoch": 0.9567250389658017, + "learning_rate": 8.656825891629228e-06, + "loss": 0.9694, + "mean_token_accuracy": 0.7124208092689515, + "num_tokens": 259877507.0, + "step": 104350 + }, + { + "epoch": 0.956816723205281, + "learning_rate": 8.638489043733384e-06, + "loss": 0.9335, + "mean_token_accuracy": 0.7144210040569305, + "num_tokens": 259905768.0, + "step": 104360 + }, + { + "epoch": 0.9569084074447602, + "learning_rate": 8.620152195837536e-06, + "loss": 0.9622, + "mean_token_accuracy": 0.7091310858726502, + "num_tokens": 259933653.0, + "step": 104370 + }, + { + "epoch": 0.9570000916842395, + "learning_rate": 8.601815347941689e-06, + "loss": 0.9641, + "mean_token_accuracy": 0.7072034657001496, + "num_tokens": 259961990.0, + "step": 104380 + }, + { + "epoch": 0.9570917759237187, + "learning_rate": 8.583478500045843e-06, + "loss": 0.9313, + "mean_token_accuracy": 0.7128926217556, + "num_tokens": 259988734.0, + "step": 104390 + }, + { + "epoch": 0.957183460163198, + "learning_rate": 8.565141652149995e-06, + "loss": 0.9676, + "mean_token_accuracy": 0.7056384682655334, + "num_tokens": 260017025.0, + "step": 104400 + }, + { + "epoch": 0.9572751444026771, + "learning_rate": 8.54680480425415e-06, + "loss": 0.9444, + "mean_token_accuracy": 0.7095074772834777, + "num_tokens": 260044921.0, + "step": 104410 + }, + { + "epoch": 0.9573668286421564, + "learning_rate": 8.528467956358302e-06, + "loss": 0.95, + "mean_token_accuracy": 0.7101873934268952, + "num_tokens": 260072620.0, + "step": 104420 + }, + { + "epoch": 0.9574585128816356, + "learning_rate": 8.510131108462455e-06, + "loss": 0.9375, + "mean_token_accuracy": 0.7134177446365356, + "num_tokens": 260100351.0, + "step": 104430 + }, + { + "epoch": 0.9575501971211149, + "learning_rate": 8.491794260566609e-06, + "loss": 0.9624, + "mean_token_accuracy": 0.7066910684108734, + "num_tokens": 260128389.0, + "step": 104440 + }, + { + "epoch": 0.9576418813605941, + "learning_rate": 8.473457412670762e-06, + "loss": 0.933, + "mean_token_accuracy": 0.7151216864585876, + "num_tokens": 260156546.0, + "step": 104450 + }, + { + "epoch": 0.9577335656000734, + "learning_rate": 8.455120564774916e-06, + "loss": 0.9883, + "mean_token_accuracy": 0.704510647058487, + "num_tokens": 260185019.0, + "step": 104460 + }, + { + "epoch": 0.9578252498395525, + "learning_rate": 8.43678371687907e-06, + "loss": 0.9482, + "mean_token_accuracy": 0.7077221691608429, + "num_tokens": 260213293.0, + "step": 104470 + }, + { + "epoch": 0.9579169340790318, + "learning_rate": 8.418446868983221e-06, + "loss": 0.9332, + "mean_token_accuracy": 0.7108700573444366, + "num_tokens": 260241811.0, + "step": 104480 + }, + { + "epoch": 0.958008618318511, + "learning_rate": 8.400110021087375e-06, + "loss": 0.9649, + "mean_token_accuracy": 0.7052967786788941, + "num_tokens": 260269445.0, + "step": 104490 + }, + { + "epoch": 0.9581003025579903, + "learning_rate": 8.381773173191528e-06, + "loss": 0.9279, + "mean_token_accuracy": 0.716957277059555, + "num_tokens": 260297199.0, + "step": 104500 + }, + { + "epoch": 0.9581919867974695, + "learning_rate": 8.363436325295682e-06, + "loss": 0.9542, + "mean_token_accuracy": 0.71466823220253, + "num_tokens": 260325191.0, + "step": 104510 + }, + { + "epoch": 0.9582836710369488, + "learning_rate": 8.345099477399836e-06, + "loss": 0.9847, + "mean_token_accuracy": 0.6977778315544129, + "num_tokens": 260353127.0, + "step": 104520 + }, + { + "epoch": 0.958375355276428, + "learning_rate": 8.326762629503987e-06, + "loss": 0.9426, + "mean_token_accuracy": 0.7164582431316375, + "num_tokens": 260380751.0, + "step": 104530 + }, + { + "epoch": 0.9584670395159072, + "learning_rate": 8.308425781608143e-06, + "loss": 0.9342, + "mean_token_accuracy": 0.717404443025589, + "num_tokens": 260407954.0, + "step": 104540 + }, + { + "epoch": 0.9585587237553864, + "learning_rate": 8.290088933712295e-06, + "loss": 0.9328, + "mean_token_accuracy": 0.7158634006977082, + "num_tokens": 260435911.0, + "step": 104550 + }, + { + "epoch": 0.9586504079948657, + "learning_rate": 8.27175208581645e-06, + "loss": 0.9257, + "mean_token_accuracy": 0.7167222380638123, + "num_tokens": 260463609.0, + "step": 104560 + }, + { + "epoch": 0.9587420922343449, + "learning_rate": 8.253415237920602e-06, + "loss": 0.9509, + "mean_token_accuracy": 0.7157267689704895, + "num_tokens": 260491648.0, + "step": 104570 + }, + { + "epoch": 0.9588337764738242, + "learning_rate": 8.235078390024755e-06, + "loss": 0.9423, + "mean_token_accuracy": 0.7102207064628601, + "num_tokens": 260519458.0, + "step": 104580 + }, + { + "epoch": 0.9589254607133034, + "learning_rate": 8.216741542128909e-06, + "loss": 0.9458, + "mean_token_accuracy": 0.7071184813976288, + "num_tokens": 260547608.0, + "step": 104590 + }, + { + "epoch": 0.9590171449527826, + "learning_rate": 8.19840469423306e-06, + "loss": 0.9482, + "mean_token_accuracy": 0.7091720163822174, + "num_tokens": 260575430.0, + "step": 104600 + }, + { + "epoch": 0.9591088291922618, + "learning_rate": 8.180067846337216e-06, + "loss": 0.9689, + "mean_token_accuracy": 0.7091881632804871, + "num_tokens": 260603092.0, + "step": 104610 + }, + { + "epoch": 0.9592005134317411, + "learning_rate": 8.161730998441368e-06, + "loss": 0.9404, + "mean_token_accuracy": 0.7148373484611511, + "num_tokens": 260630793.0, + "step": 104620 + }, + { + "epoch": 0.9592921976712203, + "learning_rate": 8.143394150545521e-06, + "loss": 0.9567, + "mean_token_accuracy": 0.7130004167556763, + "num_tokens": 260658365.0, + "step": 104630 + }, + { + "epoch": 0.9593838819106996, + "learning_rate": 8.125057302649675e-06, + "loss": 0.9447, + "mean_token_accuracy": 0.7086138665676117, + "num_tokens": 260685867.0, + "step": 104640 + }, + { + "epoch": 0.9594755661501788, + "learning_rate": 8.106720454753829e-06, + "loss": 0.9401, + "mean_token_accuracy": 0.7134073853492737, + "num_tokens": 260713414.0, + "step": 104650 + }, + { + "epoch": 0.9595672503896581, + "learning_rate": 8.088383606857982e-06, + "loss": 0.9656, + "mean_token_accuracy": 0.7081871271133423, + "num_tokens": 260740940.0, + "step": 104660 + }, + { + "epoch": 0.9596589346291372, + "learning_rate": 8.070046758962136e-06, + "loss": 0.96, + "mean_token_accuracy": 0.7073591411113739, + "num_tokens": 260769025.0, + "step": 104670 + }, + { + "epoch": 0.9597506188686165, + "learning_rate": 8.051709911066288e-06, + "loss": 0.9348, + "mean_token_accuracy": 0.7133885443210601, + "num_tokens": 260796858.0, + "step": 104680 + }, + { + "epoch": 0.9598423031080957, + "learning_rate": 8.033373063170441e-06, + "loss": 0.9303, + "mean_token_accuracy": 0.7136583507061005, + "num_tokens": 260824880.0, + "step": 104690 + }, + { + "epoch": 0.959933987347575, + "learning_rate": 8.015036215274595e-06, + "loss": 0.9415, + "mean_token_accuracy": 0.7110433340072632, + "num_tokens": 260853167.0, + "step": 104700 + }, + { + "epoch": 0.9600256715870542, + "learning_rate": 7.996699367378748e-06, + "loss": 0.9731, + "mean_token_accuracy": 0.7005956888198852, + "num_tokens": 260881834.0, + "step": 104710 + }, + { + "epoch": 0.9601173558265335, + "learning_rate": 7.978362519482902e-06, + "loss": 0.9598, + "mean_token_accuracy": 0.710364180803299, + "num_tokens": 260909873.0, + "step": 104720 + }, + { + "epoch": 0.9602090400660126, + "learning_rate": 7.960025671587054e-06, + "loss": 0.9535, + "mean_token_accuracy": 0.708672821521759, + "num_tokens": 260938189.0, + "step": 104730 + }, + { + "epoch": 0.9603007243054918, + "learning_rate": 7.941688823691209e-06, + "loss": 0.9752, + "mean_token_accuracy": 0.7049290001392364, + "num_tokens": 260966413.0, + "step": 104740 + }, + { + "epoch": 0.9603924085449711, + "learning_rate": 7.92335197579536e-06, + "loss": 1.0027, + "mean_token_accuracy": 0.6991028249263763, + "num_tokens": 260995689.0, + "step": 104750 + }, + { + "epoch": 0.9604840927844503, + "learning_rate": 7.905015127899514e-06, + "loss": 0.9393, + "mean_token_accuracy": 0.717213100194931, + "num_tokens": 261023409.0, + "step": 104760 + }, + { + "epoch": 0.9605757770239296, + "learning_rate": 7.886678280003668e-06, + "loss": 0.973, + "mean_token_accuracy": 0.7059387028217315, + "num_tokens": 261051734.0, + "step": 104770 + }, + { + "epoch": 0.9606674612634089, + "learning_rate": 7.868341432107821e-06, + "loss": 0.9709, + "mean_token_accuracy": 0.7021915435791015, + "num_tokens": 261080014.0, + "step": 104780 + }, + { + "epoch": 0.9607591455028881, + "learning_rate": 7.850004584211975e-06, + "loss": 0.9611, + "mean_token_accuracy": 0.7105751633644104, + "num_tokens": 261106989.0, + "step": 104790 + }, + { + "epoch": 0.9608508297423672, + "learning_rate": 7.831667736316127e-06, + "loss": 0.9339, + "mean_token_accuracy": 0.7151186645030976, + "num_tokens": 261135728.0, + "step": 104800 + }, + { + "epoch": 0.9609425139818465, + "learning_rate": 7.81333088842028e-06, + "loss": 0.9809, + "mean_token_accuracy": 0.7078758299350738, + "num_tokens": 261164127.0, + "step": 104810 + }, + { + "epoch": 0.9610341982213257, + "learning_rate": 7.794994040524434e-06, + "loss": 0.9533, + "mean_token_accuracy": 0.7144318103790284, + "num_tokens": 261192070.0, + "step": 104820 + }, + { + "epoch": 0.961125882460805, + "learning_rate": 7.776657192628588e-06, + "loss": 0.9378, + "mean_token_accuracy": 0.7188721597194672, + "num_tokens": 261219868.0, + "step": 104830 + }, + { + "epoch": 0.9612175667002842, + "learning_rate": 7.758320344732741e-06, + "loss": 0.9592, + "mean_token_accuracy": 0.714866328239441, + "num_tokens": 261247594.0, + "step": 104840 + }, + { + "epoch": 0.9613092509397635, + "learning_rate": 7.739983496836895e-06, + "loss": 0.9672, + "mean_token_accuracy": 0.7044365048408509, + "num_tokens": 261275505.0, + "step": 104850 + }, + { + "epoch": 0.9614009351792426, + "learning_rate": 7.721646648941047e-06, + "loss": 0.9351, + "mean_token_accuracy": 0.710863733291626, + "num_tokens": 261304391.0, + "step": 104860 + }, + { + "epoch": 0.9614926194187219, + "learning_rate": 7.703309801045202e-06, + "loss": 0.9576, + "mean_token_accuracy": 0.7064379572868347, + "num_tokens": 261331377.0, + "step": 104870 + }, + { + "epoch": 0.9615843036582011, + "learning_rate": 7.684972953149354e-06, + "loss": 0.9644, + "mean_token_accuracy": 0.7093068182468414, + "num_tokens": 261358620.0, + "step": 104880 + }, + { + "epoch": 0.9616759878976804, + "learning_rate": 7.666636105253507e-06, + "loss": 0.9472, + "mean_token_accuracy": 0.7095429003238678, + "num_tokens": 261387075.0, + "step": 104890 + }, + { + "epoch": 0.9617676721371596, + "learning_rate": 7.64829925735766e-06, + "loss": 0.9816, + "mean_token_accuracy": 0.7029368340969085, + "num_tokens": 261415523.0, + "step": 104900 + }, + { + "epoch": 0.9618593563766389, + "learning_rate": 7.629962409461813e-06, + "loss": 0.9659, + "mean_token_accuracy": 0.7069908022880554, + "num_tokens": 261443811.0, + "step": 104910 + }, + { + "epoch": 0.9619510406161181, + "learning_rate": 7.611625561565967e-06, + "loss": 0.941, + "mean_token_accuracy": 0.7135602593421936, + "num_tokens": 261471413.0, + "step": 104920 + }, + { + "epoch": 0.9620427248555973, + "learning_rate": 7.59328871367012e-06, + "loss": 0.9446, + "mean_token_accuracy": 0.7059894621372222, + "num_tokens": 261499435.0, + "step": 104930 + }, + { + "epoch": 0.9621344090950765, + "learning_rate": 7.574951865774274e-06, + "loss": 0.9864, + "mean_token_accuracy": 0.702091658115387, + "num_tokens": 261527461.0, + "step": 104940 + }, + { + "epoch": 0.9622260933345558, + "learning_rate": 7.556615017878427e-06, + "loss": 0.9681, + "mean_token_accuracy": 0.7039337754249573, + "num_tokens": 261555566.0, + "step": 104950 + }, + { + "epoch": 0.962317777574035, + "learning_rate": 7.5382781699825805e-06, + "loss": 0.9608, + "mean_token_accuracy": 0.7046442866325379, + "num_tokens": 261584279.0, + "step": 104960 + }, + { + "epoch": 0.9624094618135143, + "learning_rate": 7.519941322086733e-06, + "loss": 0.9809, + "mean_token_accuracy": 0.7080289125442505, + "num_tokens": 261612065.0, + "step": 104970 + }, + { + "epoch": 0.9625011460529935, + "learning_rate": 7.501604474190888e-06, + "loss": 0.9794, + "mean_token_accuracy": 0.7039623856544495, + "num_tokens": 261639937.0, + "step": 104980 + }, + { + "epoch": 0.9625928302924728, + "learning_rate": 7.48326762629504e-06, + "loss": 0.952, + "mean_token_accuracy": 0.7151970744132996, + "num_tokens": 261667681.0, + "step": 104990 + }, + { + "epoch": 0.9626845145319519, + "learning_rate": 7.464930778399193e-06, + "loss": 0.9684, + "mean_token_accuracy": 0.7099954128265381, + "num_tokens": 261695653.0, + "step": 105000 + }, + { + "epoch": 0.9627761987714312, + "learning_rate": 7.4465939305033466e-06, + "loss": 0.9435, + "mean_token_accuracy": 0.7093705058097839, + "num_tokens": 261724006.0, + "step": 105010 + }, + { + "epoch": 0.9628678830109104, + "learning_rate": 7.428257082607499e-06, + "loss": 0.9607, + "mean_token_accuracy": 0.7109884142875671, + "num_tokens": 261752799.0, + "step": 105020 + }, + { + "epoch": 0.9629595672503897, + "learning_rate": 7.409920234711654e-06, + "loss": 0.9432, + "mean_token_accuracy": 0.7140044867992401, + "num_tokens": 261780743.0, + "step": 105030 + }, + { + "epoch": 0.9630512514898689, + "learning_rate": 7.391583386815806e-06, + "loss": 0.9481, + "mean_token_accuracy": 0.7099042296409607, + "num_tokens": 261808303.0, + "step": 105040 + }, + { + "epoch": 0.9631429357293482, + "learning_rate": 7.37324653891996e-06, + "loss": 0.9544, + "mean_token_accuracy": 0.7053620159626007, + "num_tokens": 261836709.0, + "step": 105050 + }, + { + "epoch": 0.9632346199688273, + "learning_rate": 7.354909691024113e-06, + "loss": 0.927, + "mean_token_accuracy": 0.7229625821113587, + "num_tokens": 261863968.0, + "step": 105060 + }, + { + "epoch": 0.9633263042083066, + "learning_rate": 7.336572843128267e-06, + "loss": 0.9511, + "mean_token_accuracy": 0.7075356125831604, + "num_tokens": 261891478.0, + "step": 105070 + }, + { + "epoch": 0.9634179884477858, + "learning_rate": 7.31823599523242e-06, + "loss": 0.9783, + "mean_token_accuracy": 0.7071390867233276, + "num_tokens": 261919917.0, + "step": 105080 + }, + { + "epoch": 0.9635096726872651, + "learning_rate": 7.299899147336574e-06, + "loss": 0.9461, + "mean_token_accuracy": 0.7109041452407837, + "num_tokens": 261948322.0, + "step": 105090 + }, + { + "epoch": 0.9636013569267443, + "learning_rate": 7.281562299440726e-06, + "loss": 0.9438, + "mean_token_accuracy": 0.7165783166885376, + "num_tokens": 261975145.0, + "step": 105100 + }, + { + "epoch": 0.9636930411662236, + "learning_rate": 7.263225451544879e-06, + "loss": 0.9446, + "mean_token_accuracy": 0.7081939458847046, + "num_tokens": 262003039.0, + "step": 105110 + }, + { + "epoch": 0.9637847254057028, + "learning_rate": 7.244888603649033e-06, + "loss": 0.9325, + "mean_token_accuracy": 0.7147288918495178, + "num_tokens": 262030580.0, + "step": 105120 + }, + { + "epoch": 0.963876409645182, + "learning_rate": 7.226551755753186e-06, + "loss": 0.9625, + "mean_token_accuracy": 0.7078769147396088, + "num_tokens": 262058695.0, + "step": 105130 + }, + { + "epoch": 0.9639680938846612, + "learning_rate": 7.20821490785734e-06, + "loss": 0.9357, + "mean_token_accuracy": 0.7082073032855988, + "num_tokens": 262086304.0, + "step": 105140 + }, + { + "epoch": 0.9640597781241405, + "learning_rate": 7.189878059961492e-06, + "loss": 0.9531, + "mean_token_accuracy": 0.7161878883838654, + "num_tokens": 262114218.0, + "step": 105150 + }, + { + "epoch": 0.9641514623636197, + "learning_rate": 7.171541212065647e-06, + "loss": 0.9298, + "mean_token_accuracy": 0.7189928710460662, + "num_tokens": 262142632.0, + "step": 105160 + }, + { + "epoch": 0.964243146603099, + "learning_rate": 7.153204364169799e-06, + "loss": 0.9334, + "mean_token_accuracy": 0.7166423559188843, + "num_tokens": 262171540.0, + "step": 105170 + }, + { + "epoch": 0.9643348308425782, + "learning_rate": 7.134867516273954e-06, + "loss": 0.9293, + "mean_token_accuracy": 0.7156631767749786, + "num_tokens": 262198739.0, + "step": 105180 + }, + { + "epoch": 0.9644265150820573, + "learning_rate": 7.1165306683781064e-06, + "loss": 0.9675, + "mean_token_accuracy": 0.7043153405189514, + "num_tokens": 262226147.0, + "step": 105190 + }, + { + "epoch": 0.9645181993215366, + "learning_rate": 7.09819382048226e-06, + "loss": 0.9573, + "mean_token_accuracy": 0.7088045179843903, + "num_tokens": 262254458.0, + "step": 105200 + }, + { + "epoch": 0.9646098835610158, + "learning_rate": 7.079856972586413e-06, + "loss": 0.9581, + "mean_token_accuracy": 0.7146477222442627, + "num_tokens": 262283339.0, + "step": 105210 + }, + { + "epoch": 0.9647015678004951, + "learning_rate": 7.0615201246905654e-06, + "loss": 0.9447, + "mean_token_accuracy": 0.7116816759109497, + "num_tokens": 262311967.0, + "step": 105220 + }, + { + "epoch": 0.9647932520399743, + "learning_rate": 7.04318327679472e-06, + "loss": 0.9443, + "mean_token_accuracy": 0.7132414698600769, + "num_tokens": 262339962.0, + "step": 105230 + }, + { + "epoch": 0.9648849362794536, + "learning_rate": 7.0248464288988726e-06, + "loss": 0.9504, + "mean_token_accuracy": 0.7133159816265107, + "num_tokens": 262368672.0, + "step": 105240 + }, + { + "epoch": 0.9649766205189328, + "learning_rate": 7.006509581003026e-06, + "loss": 0.9547, + "mean_token_accuracy": 0.7095539152622223, + "num_tokens": 262396747.0, + "step": 105250 + }, + { + "epoch": 0.965068304758412, + "learning_rate": 6.988172733107179e-06, + "loss": 0.9724, + "mean_token_accuracy": 0.7134536623954773, + "num_tokens": 262424982.0, + "step": 105260 + }, + { + "epoch": 0.9651599889978912, + "learning_rate": 6.969835885211333e-06, + "loss": 0.9258, + "mean_token_accuracy": 0.7163802027702332, + "num_tokens": 262452977.0, + "step": 105270 + }, + { + "epoch": 0.9652516732373705, + "learning_rate": 6.951499037315486e-06, + "loss": 0.9448, + "mean_token_accuracy": 0.7127069056034088, + "num_tokens": 262481087.0, + "step": 105280 + }, + { + "epoch": 0.9653433574768497, + "learning_rate": 6.9331621894196395e-06, + "loss": 0.957, + "mean_token_accuracy": 0.7055570185184479, + "num_tokens": 262508553.0, + "step": 105290 + }, + { + "epoch": 0.965435041716329, + "learning_rate": 6.914825341523792e-06, + "loss": 0.9393, + "mean_token_accuracy": 0.710353285074234, + "num_tokens": 262535151.0, + "step": 105300 + }, + { + "epoch": 0.9655267259558082, + "learning_rate": 6.896488493627945e-06, + "loss": 0.9435, + "mean_token_accuracy": 0.7103923082351684, + "num_tokens": 262562783.0, + "step": 105310 + }, + { + "epoch": 0.9656184101952874, + "learning_rate": 6.878151645732099e-06, + "loss": 0.9524, + "mean_token_accuracy": 0.7078456401824951, + "num_tokens": 262591205.0, + "step": 105320 + }, + { + "epoch": 0.9657100944347666, + "learning_rate": 6.859814797836252e-06, + "loss": 0.9518, + "mean_token_accuracy": 0.7144934654235839, + "num_tokens": 262619282.0, + "step": 105330 + }, + { + "epoch": 0.9658017786742459, + "learning_rate": 6.841477949940406e-06, + "loss": 0.9788, + "mean_token_accuracy": 0.7054666340351105, + "num_tokens": 262647481.0, + "step": 105340 + }, + { + "epoch": 0.9658934629137251, + "learning_rate": 6.823141102044558e-06, + "loss": 0.9646, + "mean_token_accuracy": 0.7075164198875428, + "num_tokens": 262675147.0, + "step": 105350 + }, + { + "epoch": 0.9659851471532044, + "learning_rate": 6.804804254148713e-06, + "loss": 0.9408, + "mean_token_accuracy": 0.7170015037059784, + "num_tokens": 262702677.0, + "step": 105360 + }, + { + "epoch": 0.9660768313926836, + "learning_rate": 6.7864674062528655e-06, + "loss": 0.95, + "mean_token_accuracy": 0.7101018011569977, + "num_tokens": 262731098.0, + "step": 105370 + }, + { + "epoch": 0.9661685156321629, + "learning_rate": 6.768130558357019e-06, + "loss": 0.9564, + "mean_token_accuracy": 0.7104446828365326, + "num_tokens": 262759224.0, + "step": 105380 + }, + { + "epoch": 0.966260199871642, + "learning_rate": 6.749793710461172e-06, + "loss": 0.9706, + "mean_token_accuracy": 0.7109690129756927, + "num_tokens": 262786028.0, + "step": 105390 + }, + { + "epoch": 0.9663518841111213, + "learning_rate": 6.731456862565326e-06, + "loss": 0.9449, + "mean_token_accuracy": 0.7134011149406433, + "num_tokens": 262813623.0, + "step": 105400 + }, + { + "epoch": 0.9664435683506005, + "learning_rate": 6.713120014669479e-06, + "loss": 0.9664, + "mean_token_accuracy": 0.7101104557514191, + "num_tokens": 262841230.0, + "step": 105410 + }, + { + "epoch": 0.9665352525900798, + "learning_rate": 6.694783166773632e-06, + "loss": 0.9366, + "mean_token_accuracy": 0.7136660933494567, + "num_tokens": 262869144.0, + "step": 105420 + }, + { + "epoch": 0.966626936829559, + "learning_rate": 6.676446318877785e-06, + "loss": 0.9469, + "mean_token_accuracy": 0.7105951428413391, + "num_tokens": 262897349.0, + "step": 105430 + }, + { + "epoch": 0.9667186210690383, + "learning_rate": 6.658109470981938e-06, + "loss": 0.9895, + "mean_token_accuracy": 0.7003681600093842, + "num_tokens": 262925732.0, + "step": 105440 + }, + { + "epoch": 0.9668103053085174, + "learning_rate": 6.639772623086092e-06, + "loss": 0.9481, + "mean_token_accuracy": 0.7137551486492157, + "num_tokens": 262953066.0, + "step": 105450 + }, + { + "epoch": 0.9669019895479967, + "learning_rate": 6.621435775190245e-06, + "loss": 0.9664, + "mean_token_accuracy": 0.7069268226623535, + "num_tokens": 262980482.0, + "step": 105460 + }, + { + "epoch": 0.9669936737874759, + "learning_rate": 6.6030989272943985e-06, + "loss": 0.9718, + "mean_token_accuracy": 0.7009297668933868, + "num_tokens": 263008269.0, + "step": 105470 + }, + { + "epoch": 0.9670853580269552, + "learning_rate": 6.584762079398551e-06, + "loss": 0.9595, + "mean_token_accuracy": 0.7061017990112305, + "num_tokens": 263037066.0, + "step": 105480 + }, + { + "epoch": 0.9671770422664344, + "learning_rate": 6.566425231502706e-06, + "loss": 0.9384, + "mean_token_accuracy": 0.7098778247833252, + "num_tokens": 263064869.0, + "step": 105490 + }, + { + "epoch": 0.9672687265059137, + "learning_rate": 6.548088383606858e-06, + "loss": 0.9452, + "mean_token_accuracy": 0.7145616352558136, + "num_tokens": 263092062.0, + "step": 105500 + }, + { + "epoch": 0.9673604107453929, + "learning_rate": 6.529751535711012e-06, + "loss": 0.9376, + "mean_token_accuracy": 0.7121304333209991, + "num_tokens": 263120349.0, + "step": 105510 + }, + { + "epoch": 0.9674520949848721, + "learning_rate": 6.511414687815165e-06, + "loss": 0.9398, + "mean_token_accuracy": 0.7116935789585114, + "num_tokens": 263148407.0, + "step": 105520 + }, + { + "epoch": 0.9675437792243513, + "learning_rate": 6.493077839919317e-06, + "loss": 0.9463, + "mean_token_accuracy": 0.7124622941017151, + "num_tokens": 263176388.0, + "step": 105530 + }, + { + "epoch": 0.9676354634638306, + "learning_rate": 6.474740992023472e-06, + "loss": 0.9404, + "mean_token_accuracy": 0.708881276845932, + "num_tokens": 263204048.0, + "step": 105540 + }, + { + "epoch": 0.9677271477033098, + "learning_rate": 6.4564041441276245e-06, + "loss": 0.9435, + "mean_token_accuracy": 0.7130149960517883, + "num_tokens": 263232383.0, + "step": 105550 + }, + { + "epoch": 0.9678188319427891, + "learning_rate": 6.438067296231778e-06, + "loss": 0.9235, + "mean_token_accuracy": 0.718024605512619, + "num_tokens": 263260435.0, + "step": 105560 + }, + { + "epoch": 0.9679105161822683, + "learning_rate": 6.419730448335931e-06, + "loss": 0.9416, + "mean_token_accuracy": 0.7133037686347962, + "num_tokens": 263286886.0, + "step": 105570 + }, + { + "epoch": 0.9680022004217474, + "learning_rate": 6.401393600440085e-06, + "loss": 0.9785, + "mean_token_accuracy": 0.7028957009315491, + "num_tokens": 263314053.0, + "step": 105580 + }, + { + "epoch": 0.9680938846612267, + "learning_rate": 6.383056752544238e-06, + "loss": 0.9432, + "mean_token_accuracy": 0.7095845997333526, + "num_tokens": 263341797.0, + "step": 105590 + }, + { + "epoch": 0.968185568900706, + "learning_rate": 6.3647199046483915e-06, + "loss": 0.9373, + "mean_token_accuracy": 0.7112450778484345, + "num_tokens": 263369146.0, + "step": 105600 + }, + { + "epoch": 0.9682772531401852, + "learning_rate": 6.346383056752544e-06, + "loss": 0.9494, + "mean_token_accuracy": 0.7115423262119294, + "num_tokens": 263397012.0, + "step": 105610 + }, + { + "epoch": 0.9683689373796645, + "learning_rate": 6.328046208856697e-06, + "loss": 0.9983, + "mean_token_accuracy": 0.7018362998962402, + "num_tokens": 263424803.0, + "step": 105620 + }, + { + "epoch": 0.9684606216191437, + "learning_rate": 6.309709360960851e-06, + "loss": 0.9581, + "mean_token_accuracy": 0.7116221487522125, + "num_tokens": 263451470.0, + "step": 105630 + }, + { + "epoch": 0.968552305858623, + "learning_rate": 6.291372513065004e-06, + "loss": 0.9268, + "mean_token_accuracy": 0.7161617338657379, + "num_tokens": 263479191.0, + "step": 105640 + }, + { + "epoch": 0.9686439900981021, + "learning_rate": 6.2730356651691576e-06, + "loss": 0.9652, + "mean_token_accuracy": 0.7056613743305207, + "num_tokens": 263507135.0, + "step": 105650 + }, + { + "epoch": 0.9687356743375813, + "learning_rate": 6.25469881727331e-06, + "loss": 0.9407, + "mean_token_accuracy": 0.7149433672428132, + "num_tokens": 263534794.0, + "step": 105660 + }, + { + "epoch": 0.9688273585770606, + "learning_rate": 6.236361969377464e-06, + "loss": 0.962, + "mean_token_accuracy": 0.7107852518558502, + "num_tokens": 263561540.0, + "step": 105670 + }, + { + "epoch": 0.9689190428165398, + "learning_rate": 6.218025121481617e-06, + "loss": 0.9334, + "mean_token_accuracy": 0.7102938771247864, + "num_tokens": 263589535.0, + "step": 105680 + }, + { + "epoch": 0.9690107270560191, + "learning_rate": 6.199688273585771e-06, + "loss": 0.9606, + "mean_token_accuracy": 0.7076380312442779, + "num_tokens": 263617009.0, + "step": 105690 + }, + { + "epoch": 0.9691024112954983, + "learning_rate": 6.181351425689924e-06, + "loss": 0.9445, + "mean_token_accuracy": 0.7133013665676117, + "num_tokens": 263645206.0, + "step": 105700 + }, + { + "epoch": 0.9691940955349775, + "learning_rate": 6.163014577794077e-06, + "loss": 0.9477, + "mean_token_accuracy": 0.7096609771251678, + "num_tokens": 263672933.0, + "step": 105710 + }, + { + "epoch": 0.9692857797744567, + "learning_rate": 6.144677729898231e-06, + "loss": 0.9296, + "mean_token_accuracy": 0.7168624103069305, + "num_tokens": 263701127.0, + "step": 105720 + }, + { + "epoch": 0.969377464013936, + "learning_rate": 6.126340882002384e-06, + "loss": 0.9661, + "mean_token_accuracy": 0.7041217029094696, + "num_tokens": 263729579.0, + "step": 105730 + }, + { + "epoch": 0.9694691482534152, + "learning_rate": 6.108004034106538e-06, + "loss": 0.9826, + "mean_token_accuracy": 0.7042882442474365, + "num_tokens": 263757512.0, + "step": 105740 + }, + { + "epoch": 0.9695608324928945, + "learning_rate": 6.089667186210691e-06, + "loss": 0.9596, + "mean_token_accuracy": 0.7068013250827789, + "num_tokens": 263785390.0, + "step": 105750 + }, + { + "epoch": 0.9696525167323737, + "learning_rate": 6.071330338314844e-06, + "loss": 0.9658, + "mean_token_accuracy": 0.7056807041168213, + "num_tokens": 263813407.0, + "step": 105760 + }, + { + "epoch": 0.969744200971853, + "learning_rate": 6.052993490418997e-06, + "loss": 0.933, + "mean_token_accuracy": 0.7154004454612732, + "num_tokens": 263839629.0, + "step": 105770 + }, + { + "epoch": 0.9698358852113321, + "learning_rate": 6.0346566425231505e-06, + "loss": 0.9253, + "mean_token_accuracy": 0.7129565477371216, + "num_tokens": 263867682.0, + "step": 105780 + }, + { + "epoch": 0.9699275694508114, + "learning_rate": 6.016319794627304e-06, + "loss": 0.9732, + "mean_token_accuracy": 0.7071649730205536, + "num_tokens": 263895853.0, + "step": 105790 + }, + { + "epoch": 0.9700192536902906, + "learning_rate": 5.997982946731457e-06, + "loss": 0.9445, + "mean_token_accuracy": 0.7088455379009246, + "num_tokens": 263924163.0, + "step": 105800 + }, + { + "epoch": 0.9701109379297699, + "learning_rate": 5.97964609883561e-06, + "loss": 0.9721, + "mean_token_accuracy": 0.7049594759941101, + "num_tokens": 263951542.0, + "step": 105810 + }, + { + "epoch": 0.9702026221692491, + "learning_rate": 5.961309250939764e-06, + "loss": 0.968, + "mean_token_accuracy": 0.7079796195030212, + "num_tokens": 263979628.0, + "step": 105820 + }, + { + "epoch": 0.9702943064087284, + "learning_rate": 5.9429724030439174e-06, + "loss": 0.959, + "mean_token_accuracy": 0.7132765114307403, + "num_tokens": 264007484.0, + "step": 105830 + }, + { + "epoch": 0.9703859906482075, + "learning_rate": 5.92463555514807e-06, + "loss": 0.9537, + "mean_token_accuracy": 0.7099129557609558, + "num_tokens": 264036186.0, + "step": 105840 + }, + { + "epoch": 0.9704776748876868, + "learning_rate": 5.906298707252224e-06, + "loss": 0.948, + "mean_token_accuracy": 0.7068579435348511, + "num_tokens": 264063993.0, + "step": 105850 + }, + { + "epoch": 0.970569359127166, + "learning_rate": 5.887961859356377e-06, + "loss": 0.9788, + "mean_token_accuracy": 0.7074842393398285, + "num_tokens": 264091842.0, + "step": 105860 + }, + { + "epoch": 0.9706610433666453, + "learning_rate": 5.86962501146053e-06, + "loss": 0.9667, + "mean_token_accuracy": 0.7055523753166199, + "num_tokens": 264119708.0, + "step": 105870 + }, + { + "epoch": 0.9707527276061245, + "learning_rate": 5.8512881635646836e-06, + "loss": 0.9637, + "mean_token_accuracy": 0.7075406670570373, + "num_tokens": 264147846.0, + "step": 105880 + }, + { + "epoch": 0.9708444118456038, + "learning_rate": 5.832951315668836e-06, + "loss": 0.942, + "mean_token_accuracy": 0.7142965495586395, + "num_tokens": 264175416.0, + "step": 105890 + }, + { + "epoch": 0.970936096085083, + "learning_rate": 5.81461446777299e-06, + "loss": 0.9655, + "mean_token_accuracy": 0.7091979920864105, + "num_tokens": 264203049.0, + "step": 105900 + }, + { + "epoch": 0.9710277803245622, + "learning_rate": 5.796277619877143e-06, + "loss": 0.9635, + "mean_token_accuracy": 0.7098026514053345, + "num_tokens": 264229934.0, + "step": 105910 + }, + { + "epoch": 0.9711194645640414, + "learning_rate": 5.777940771981297e-06, + "loss": 0.9288, + "mean_token_accuracy": 0.7123159825801849, + "num_tokens": 264257309.0, + "step": 105920 + }, + { + "epoch": 0.9712111488035207, + "learning_rate": 5.75960392408545e-06, + "loss": 0.9748, + "mean_token_accuracy": 0.7069181799888611, + "num_tokens": 264284430.0, + "step": 105930 + }, + { + "epoch": 0.9713028330429999, + "learning_rate": 5.741267076189603e-06, + "loss": 0.9513, + "mean_token_accuracy": 0.7107536494731903, + "num_tokens": 264312628.0, + "step": 105940 + }, + { + "epoch": 0.9713945172824792, + "learning_rate": 5.722930228293757e-06, + "loss": 0.9587, + "mean_token_accuracy": 0.7086152553558349, + "num_tokens": 264341729.0, + "step": 105950 + }, + { + "epoch": 0.9714862015219584, + "learning_rate": 5.70459338039791e-06, + "loss": 0.9469, + "mean_token_accuracy": 0.7136449694633484, + "num_tokens": 264369762.0, + "step": 105960 + }, + { + "epoch": 0.9715778857614376, + "learning_rate": 5.686256532502064e-06, + "loss": 0.9527, + "mean_token_accuracy": 0.7097286641597748, + "num_tokens": 264396983.0, + "step": 105970 + }, + { + "epoch": 0.9716695700009168, + "learning_rate": 5.667919684606216e-06, + "loss": 0.9564, + "mean_token_accuracy": 0.7044010639190674, + "num_tokens": 264424606.0, + "step": 105980 + }, + { + "epoch": 0.971761254240396, + "learning_rate": 5.649582836710369e-06, + "loss": 0.9512, + "mean_token_accuracy": 0.7110239386558532, + "num_tokens": 264453567.0, + "step": 105990 + }, + { + "epoch": 0.9718529384798753, + "learning_rate": 5.631245988814523e-06, + "loss": 0.939, + "mean_token_accuracy": 0.7180724620819092, + "num_tokens": 264481233.0, + "step": 106000 + }, + { + "epoch": 0.9719446227193546, + "learning_rate": 5.6129091409186765e-06, + "loss": 0.9823, + "mean_token_accuracy": 0.7070731580257416, + "num_tokens": 264508448.0, + "step": 106010 + }, + { + "epoch": 0.9720363069588338, + "learning_rate": 5.59457229302283e-06, + "loss": 0.9581, + "mean_token_accuracy": 0.7078408002853394, + "num_tokens": 264535958.0, + "step": 106020 + }, + { + "epoch": 0.9721279911983131, + "learning_rate": 5.576235445126983e-06, + "loss": 0.9699, + "mean_token_accuracy": 0.7089482188224793, + "num_tokens": 264563452.0, + "step": 106030 + }, + { + "epoch": 0.9722196754377922, + "learning_rate": 5.557898597231136e-06, + "loss": 0.9746, + "mean_token_accuracy": 0.7037977755069733, + "num_tokens": 264591147.0, + "step": 106040 + }, + { + "epoch": 0.9723113596772714, + "learning_rate": 5.53956174933529e-06, + "loss": 0.9537, + "mean_token_accuracy": 0.7138411521911621, + "num_tokens": 264619344.0, + "step": 106050 + }, + { + "epoch": 0.9724030439167507, + "learning_rate": 5.5212249014394434e-06, + "loss": 0.9313, + "mean_token_accuracy": 0.7180680215358735, + "num_tokens": 264647475.0, + "step": 106060 + }, + { + "epoch": 0.97249472815623, + "learning_rate": 5.502888053543596e-06, + "loss": 0.9589, + "mean_token_accuracy": 0.7090674996376037, + "num_tokens": 264674309.0, + "step": 106070 + }, + { + "epoch": 0.9725864123957092, + "learning_rate": 5.484551205647749e-06, + "loss": 0.9751, + "mean_token_accuracy": 0.7034432351589203, + "num_tokens": 264702248.0, + "step": 106080 + }, + { + "epoch": 0.9726780966351884, + "learning_rate": 5.466214357751902e-06, + "loss": 0.9138, + "mean_token_accuracy": 0.7175294697284699, + "num_tokens": 264729778.0, + "step": 106090 + }, + { + "epoch": 0.9727697808746677, + "learning_rate": 5.447877509856056e-06, + "loss": 0.96, + "mean_token_accuracy": 0.7127042353153229, + "num_tokens": 264757489.0, + "step": 106100 + }, + { + "epoch": 0.9728614651141468, + "learning_rate": 5.4295406619602095e-06, + "loss": 0.9158, + "mean_token_accuracy": 0.7221392869949341, + "num_tokens": 264785683.0, + "step": 106110 + }, + { + "epoch": 0.9729531493536261, + "learning_rate": 5.411203814064362e-06, + "loss": 0.9778, + "mean_token_accuracy": 0.7075231373310089, + "num_tokens": 264813270.0, + "step": 106120 + }, + { + "epoch": 0.9730448335931053, + "learning_rate": 5.392866966168516e-06, + "loss": 0.9207, + "mean_token_accuracy": 0.7147023320198059, + "num_tokens": 264840288.0, + "step": 106130 + }, + { + "epoch": 0.9731365178325846, + "learning_rate": 5.374530118272669e-06, + "loss": 0.9514, + "mean_token_accuracy": 0.7081270277500152, + "num_tokens": 264868023.0, + "step": 106140 + }, + { + "epoch": 0.9732282020720638, + "learning_rate": 5.356193270376823e-06, + "loss": 0.9371, + "mean_token_accuracy": 0.7109180867671967, + "num_tokens": 264895408.0, + "step": 106150 + }, + { + "epoch": 0.9733198863115431, + "learning_rate": 5.337856422480976e-06, + "loss": 0.9578, + "mean_token_accuracy": 0.7068678259849548, + "num_tokens": 264922737.0, + "step": 106160 + }, + { + "epoch": 0.9734115705510222, + "learning_rate": 5.319519574585129e-06, + "loss": 0.9543, + "mean_token_accuracy": 0.7071869909763336, + "num_tokens": 264951109.0, + "step": 106170 + }, + { + "epoch": 0.9735032547905015, + "learning_rate": 5.301182726689282e-06, + "loss": 0.9513, + "mean_token_accuracy": 0.711639142036438, + "num_tokens": 264978504.0, + "step": 106180 + }, + { + "epoch": 0.9735949390299807, + "learning_rate": 5.2828458787934355e-06, + "loss": 0.9569, + "mean_token_accuracy": 0.7065433025360107, + "num_tokens": 265006590.0, + "step": 106190 + }, + { + "epoch": 0.97368662326946, + "learning_rate": 5.264509030897589e-06, + "loss": 0.9273, + "mean_token_accuracy": 0.7189335882663727, + "num_tokens": 265035287.0, + "step": 106200 + }, + { + "epoch": 0.9737783075089392, + "learning_rate": 5.246172183001742e-06, + "loss": 0.9557, + "mean_token_accuracy": 0.7066478848457336, + "num_tokens": 265062813.0, + "step": 106210 + }, + { + "epoch": 0.9738699917484185, + "learning_rate": 5.227835335105895e-06, + "loss": 0.9384, + "mean_token_accuracy": 0.7121494829654693, + "num_tokens": 265090979.0, + "step": 106220 + }, + { + "epoch": 0.9739616759878977, + "learning_rate": 5.209498487210049e-06, + "loss": 0.9563, + "mean_token_accuracy": 0.7068563342094422, + "num_tokens": 265118358.0, + "step": 106230 + }, + { + "epoch": 0.9740533602273769, + "learning_rate": 5.1911616393142025e-06, + "loss": 0.9583, + "mean_token_accuracy": 0.7092251658439637, + "num_tokens": 265146472.0, + "step": 106240 + }, + { + "epoch": 0.9741450444668561, + "learning_rate": 5.172824791418355e-06, + "loss": 0.9762, + "mean_token_accuracy": 0.7026823461055756, + "num_tokens": 265174138.0, + "step": 106250 + }, + { + "epoch": 0.9742367287063354, + "learning_rate": 5.154487943522509e-06, + "loss": 0.9571, + "mean_token_accuracy": 0.7108917355537414, + "num_tokens": 265201558.0, + "step": 106260 + }, + { + "epoch": 0.9743284129458146, + "learning_rate": 5.136151095626662e-06, + "loss": 0.965, + "mean_token_accuracy": 0.7082030355930329, + "num_tokens": 265230750.0, + "step": 106270 + }, + { + "epoch": 0.9744200971852939, + "learning_rate": 5.117814247730816e-06, + "loss": 0.9732, + "mean_token_accuracy": 0.7060872912406921, + "num_tokens": 265257747.0, + "step": 106280 + }, + { + "epoch": 0.9745117814247731, + "learning_rate": 5.0994773998349686e-06, + "loss": 0.9595, + "mean_token_accuracy": 0.7112521946430206, + "num_tokens": 265285523.0, + "step": 106290 + }, + { + "epoch": 0.9746034656642523, + "learning_rate": 5.081140551939121e-06, + "loss": 0.9535, + "mean_token_accuracy": 0.7129338502883911, + "num_tokens": 265313178.0, + "step": 106300 + }, + { + "epoch": 0.9746951499037315, + "learning_rate": 5.062803704043275e-06, + "loss": 0.9557, + "mean_token_accuracy": 0.7092982530593872, + "num_tokens": 265340824.0, + "step": 106310 + }, + { + "epoch": 0.9747868341432108, + "learning_rate": 5.044466856147428e-06, + "loss": 0.9406, + "mean_token_accuracy": 0.7075697779655457, + "num_tokens": 265368493.0, + "step": 106320 + }, + { + "epoch": 0.97487851838269, + "learning_rate": 5.026130008251582e-06, + "loss": 0.9494, + "mean_token_accuracy": 0.7144442856311798, + "num_tokens": 265396552.0, + "step": 106330 + }, + { + "epoch": 0.9749702026221693, + "learning_rate": 5.0077931603557355e-06, + "loss": 0.9342, + "mean_token_accuracy": 0.715404623746872, + "num_tokens": 265424256.0, + "step": 106340 + }, + { + "epoch": 0.9750618868616485, + "learning_rate": 4.989456312459888e-06, + "loss": 0.9462, + "mean_token_accuracy": 0.7162149667739868, + "num_tokens": 265451815.0, + "step": 106350 + }, + { + "epoch": 0.9751535711011278, + "learning_rate": 4.971119464564042e-06, + "loss": 0.979, + "mean_token_accuracy": 0.7023785650730133, + "num_tokens": 265480157.0, + "step": 106360 + }, + { + "epoch": 0.9752452553406069, + "learning_rate": 4.952782616668195e-06, + "loss": 0.9623, + "mean_token_accuracy": 0.7010857045650483, + "num_tokens": 265508075.0, + "step": 106370 + }, + { + "epoch": 0.9753369395800862, + "learning_rate": 4.934445768772349e-06, + "loss": 0.9822, + "mean_token_accuracy": 0.7071395516395569, + "num_tokens": 265535857.0, + "step": 106380 + }, + { + "epoch": 0.9754286238195654, + "learning_rate": 4.916108920876502e-06, + "loss": 0.9742, + "mean_token_accuracy": 0.7060118317604065, + "num_tokens": 265563541.0, + "step": 106390 + }, + { + "epoch": 0.9755203080590447, + "learning_rate": 4.897772072980654e-06, + "loss": 0.9035, + "mean_token_accuracy": 0.7206015467643738, + "num_tokens": 265591285.0, + "step": 106400 + }, + { + "epoch": 0.9756119922985239, + "learning_rate": 4.879435225084808e-06, + "loss": 0.9435, + "mean_token_accuracy": 0.7146306753158569, + "num_tokens": 265618805.0, + "step": 106410 + }, + { + "epoch": 0.9757036765380032, + "learning_rate": 4.8610983771889615e-06, + "loss": 0.972, + "mean_token_accuracy": 0.7071013391017914, + "num_tokens": 265647800.0, + "step": 106420 + }, + { + "epoch": 0.9757953607774823, + "learning_rate": 4.842761529293115e-06, + "loss": 0.9456, + "mean_token_accuracy": 0.7121579349040985, + "num_tokens": 265675256.0, + "step": 106430 + }, + { + "epoch": 0.9758870450169616, + "learning_rate": 4.824424681397268e-06, + "loss": 0.9694, + "mean_token_accuracy": 0.7056652307510376, + "num_tokens": 265703943.0, + "step": 106440 + }, + { + "epoch": 0.9759787292564408, + "learning_rate": 4.806087833501421e-06, + "loss": 0.9331, + "mean_token_accuracy": 0.7131913483142853, + "num_tokens": 265731873.0, + "step": 106450 + }, + { + "epoch": 0.97607041349592, + "learning_rate": 4.787750985605575e-06, + "loss": 0.9562, + "mean_token_accuracy": 0.7071906805038453, + "num_tokens": 265759759.0, + "step": 106460 + }, + { + "epoch": 0.9761620977353993, + "learning_rate": 4.7694141377097284e-06, + "loss": 0.9534, + "mean_token_accuracy": 0.7083316087722779, + "num_tokens": 265787275.0, + "step": 106470 + }, + { + "epoch": 0.9762537819748786, + "learning_rate": 4.751077289813881e-06, + "loss": 0.9486, + "mean_token_accuracy": 0.7126296639442444, + "num_tokens": 265815670.0, + "step": 106480 + }, + { + "epoch": 0.9763454662143578, + "learning_rate": 4.732740441918034e-06, + "loss": 0.9639, + "mean_token_accuracy": 0.7070540189743042, + "num_tokens": 265843969.0, + "step": 106490 + }, + { + "epoch": 0.9764371504538369, + "learning_rate": 4.7144035940221874e-06, + "loss": 0.9686, + "mean_token_accuracy": 0.710118442773819, + "num_tokens": 265872055.0, + "step": 106500 + }, + { + "epoch": 0.9765288346933162, + "learning_rate": 4.696066746126341e-06, + "loss": 0.979, + "mean_token_accuracy": 0.7022459447383881, + "num_tokens": 265900485.0, + "step": 106510 + }, + { + "epoch": 0.9766205189327954, + "learning_rate": 4.6777298982304946e-06, + "loss": 0.9562, + "mean_token_accuracy": 0.7102384209632874, + "num_tokens": 265927929.0, + "step": 106520 + }, + { + "epoch": 0.9767122031722747, + "learning_rate": 4.659393050334647e-06, + "loss": 0.9668, + "mean_token_accuracy": 0.7090049982070923, + "num_tokens": 265956047.0, + "step": 106530 + }, + { + "epoch": 0.976803887411754, + "learning_rate": 4.641056202438801e-06, + "loss": 0.9515, + "mean_token_accuracy": 0.709384435415268, + "num_tokens": 265984890.0, + "step": 106540 + }, + { + "epoch": 0.9768955716512332, + "learning_rate": 4.622719354542954e-06, + "loss": 0.9064, + "mean_token_accuracy": 0.7182036519050599, + "num_tokens": 266012722.0, + "step": 106550 + }, + { + "epoch": 0.9769872558907123, + "learning_rate": 4.604382506647108e-06, + "loss": 0.9884, + "mean_token_accuracy": 0.7036374330520629, + "num_tokens": 266041019.0, + "step": 106560 + }, + { + "epoch": 0.9770789401301916, + "learning_rate": 4.5860456587512615e-06, + "loss": 0.9733, + "mean_token_accuracy": 0.7008701801300049, + "num_tokens": 266068470.0, + "step": 106570 + }, + { + "epoch": 0.9771706243696708, + "learning_rate": 4.567708810855414e-06, + "loss": 0.9794, + "mean_token_accuracy": 0.7040487945079803, + "num_tokens": 266096213.0, + "step": 106580 + }, + { + "epoch": 0.9772623086091501, + "learning_rate": 4.549371962959567e-06, + "loss": 0.9669, + "mean_token_accuracy": 0.7039185881614685, + "num_tokens": 266124188.0, + "step": 106590 + }, + { + "epoch": 0.9773539928486293, + "learning_rate": 4.5310351150637205e-06, + "loss": 0.961, + "mean_token_accuracy": 0.7082109749317169, + "num_tokens": 266151873.0, + "step": 106600 + }, + { + "epoch": 0.9774456770881086, + "learning_rate": 4.512698267167874e-06, + "loss": 0.9339, + "mean_token_accuracy": 0.7134939074516297, + "num_tokens": 266179822.0, + "step": 106610 + }, + { + "epoch": 0.9775373613275878, + "learning_rate": 4.494361419272028e-06, + "loss": 0.9337, + "mean_token_accuracy": 0.718496972322464, + "num_tokens": 266208001.0, + "step": 106620 + }, + { + "epoch": 0.977629045567067, + "learning_rate": 4.47602457137618e-06, + "loss": 0.9424, + "mean_token_accuracy": 0.7149182856082916, + "num_tokens": 266236315.0, + "step": 106630 + }, + { + "epoch": 0.9777207298065462, + "learning_rate": 4.457687723480334e-06, + "loss": 0.9821, + "mean_token_accuracy": 0.7090541541576385, + "num_tokens": 266265058.0, + "step": 106640 + }, + { + "epoch": 0.9778124140460255, + "learning_rate": 4.4393508755844875e-06, + "loss": 0.9424, + "mean_token_accuracy": 0.7143906235694886, + "num_tokens": 266292251.0, + "step": 106650 + }, + { + "epoch": 0.9779040982855047, + "learning_rate": 4.421014027688641e-06, + "loss": 0.9228, + "mean_token_accuracy": 0.7171306908130646, + "num_tokens": 266319962.0, + "step": 106660 + }, + { + "epoch": 0.977995782524984, + "learning_rate": 4.402677179792794e-06, + "loss": 0.9609, + "mean_token_accuracy": 0.7086678266525268, + "num_tokens": 266347973.0, + "step": 106670 + }, + { + "epoch": 0.9780874667644632, + "learning_rate": 4.384340331896947e-06, + "loss": 0.9419, + "mean_token_accuracy": 0.7154306769371033, + "num_tokens": 266376650.0, + "step": 106680 + }, + { + "epoch": 0.9781791510039424, + "learning_rate": 4.366003484001101e-06, + "loss": 0.9431, + "mean_token_accuracy": 0.7204812347888947, + "num_tokens": 266404202.0, + "step": 106690 + }, + { + "epoch": 0.9782708352434216, + "learning_rate": 4.347666636105254e-06, + "loss": 0.9713, + "mean_token_accuracy": 0.7069407284259797, + "num_tokens": 266432172.0, + "step": 106700 + }, + { + "epoch": 0.9783625194829009, + "learning_rate": 4.329329788209407e-06, + "loss": 0.9628, + "mean_token_accuracy": 0.7112584054470062, + "num_tokens": 266459803.0, + "step": 106710 + }, + { + "epoch": 0.9784542037223801, + "learning_rate": 4.31099294031356e-06, + "loss": 0.9202, + "mean_token_accuracy": 0.7176357507705688, + "num_tokens": 266488015.0, + "step": 106720 + }, + { + "epoch": 0.9785458879618594, + "learning_rate": 4.292656092417713e-06, + "loss": 0.9538, + "mean_token_accuracy": 0.7114960134029389, + "num_tokens": 266515594.0, + "step": 106730 + }, + { + "epoch": 0.9786375722013386, + "learning_rate": 4.274319244521867e-06, + "loss": 0.9458, + "mean_token_accuracy": 0.7117897689342498, + "num_tokens": 266543314.0, + "step": 106740 + }, + { + "epoch": 0.9787292564408179, + "learning_rate": 4.2559823966260205e-06, + "loss": 0.968, + "mean_token_accuracy": 0.7120352983474731, + "num_tokens": 266571211.0, + "step": 106750 + }, + { + "epoch": 0.978820940680297, + "learning_rate": 4.237645548730173e-06, + "loss": 0.9492, + "mean_token_accuracy": 0.7072612285614014, + "num_tokens": 266599142.0, + "step": 106760 + }, + { + "epoch": 0.9789126249197763, + "learning_rate": 4.219308700834327e-06, + "loss": 0.9631, + "mean_token_accuracy": 0.7073183059692383, + "num_tokens": 266627729.0, + "step": 106770 + }, + { + "epoch": 0.9790043091592555, + "learning_rate": 4.20097185293848e-06, + "loss": 0.9625, + "mean_token_accuracy": 0.7120635509490967, + "num_tokens": 266656536.0, + "step": 106780 + }, + { + "epoch": 0.9790959933987348, + "learning_rate": 4.182635005042634e-06, + "loss": 0.9282, + "mean_token_accuracy": 0.7160631656646729, + "num_tokens": 266684094.0, + "step": 106790 + }, + { + "epoch": 0.979187677638214, + "learning_rate": 4.164298157146787e-06, + "loss": 0.9467, + "mean_token_accuracy": 0.7072149753570557, + "num_tokens": 266712354.0, + "step": 106800 + }, + { + "epoch": 0.9792793618776933, + "learning_rate": 4.145961309250939e-06, + "loss": 0.9457, + "mean_token_accuracy": 0.7111077785491944, + "num_tokens": 266740969.0, + "step": 106810 + }, + { + "epoch": 0.9793710461171724, + "learning_rate": 4.127624461355093e-06, + "loss": 0.9679, + "mean_token_accuracy": 0.7086487650871277, + "num_tokens": 266768822.0, + "step": 106820 + }, + { + "epoch": 0.9794627303566517, + "learning_rate": 4.1092876134592465e-06, + "loss": 0.9465, + "mean_token_accuracy": 0.713647437095642, + "num_tokens": 266795807.0, + "step": 106830 + }, + { + "epoch": 0.9795544145961309, + "learning_rate": 4.0909507655634e-06, + "loss": 0.9546, + "mean_token_accuracy": 0.7055732071399688, + "num_tokens": 266825252.0, + "step": 106840 + }, + { + "epoch": 0.9796460988356102, + "learning_rate": 4.072613917667553e-06, + "loss": 0.936, + "mean_token_accuracy": 0.7111010015010834, + "num_tokens": 266854538.0, + "step": 106850 + }, + { + "epoch": 0.9797377830750894, + "learning_rate": 4.054277069771706e-06, + "loss": 0.9588, + "mean_token_accuracy": 0.7043581068515777, + "num_tokens": 266882684.0, + "step": 106860 + }, + { + "epoch": 0.9798294673145687, + "learning_rate": 4.03594022187586e-06, + "loss": 0.9505, + "mean_token_accuracy": 0.7151164412498474, + "num_tokens": 266911360.0, + "step": 106870 + }, + { + "epoch": 0.9799211515540479, + "learning_rate": 4.0176033739800135e-06, + "loss": 0.9509, + "mean_token_accuracy": 0.7084515392780304, + "num_tokens": 266939420.0, + "step": 106880 + }, + { + "epoch": 0.980012835793527, + "learning_rate": 3.999266526084167e-06, + "loss": 0.9493, + "mean_token_accuracy": 0.7123298645019531, + "num_tokens": 266967245.0, + "step": 106890 + }, + { + "epoch": 0.9801045200330063, + "learning_rate": 3.980929678188319e-06, + "loss": 0.9588, + "mean_token_accuracy": 0.7104962050914765, + "num_tokens": 266994626.0, + "step": 106900 + }, + { + "epoch": 0.9801962042724855, + "learning_rate": 3.9625928302924724e-06, + "loss": 0.9501, + "mean_token_accuracy": 0.7113950729370118, + "num_tokens": 267022198.0, + "step": 106910 + }, + { + "epoch": 0.9802878885119648, + "learning_rate": 3.944255982396626e-06, + "loss": 0.9536, + "mean_token_accuracy": 0.7085495054721832, + "num_tokens": 267050493.0, + "step": 106920 + }, + { + "epoch": 0.980379572751444, + "learning_rate": 3.9259191345007796e-06, + "loss": 0.9789, + "mean_token_accuracy": 0.7024223268032074, + "num_tokens": 267078180.0, + "step": 106930 + }, + { + "epoch": 0.9804712569909233, + "learning_rate": 3.907582286604933e-06, + "loss": 0.9732, + "mean_token_accuracy": 0.7009832084178924, + "num_tokens": 267106692.0, + "step": 106940 + }, + { + "epoch": 0.9805629412304024, + "learning_rate": 3.889245438709086e-06, + "loss": 0.941, + "mean_token_accuracy": 0.7072395741939544, + "num_tokens": 267135277.0, + "step": 106950 + }, + { + "epoch": 0.9806546254698817, + "learning_rate": 3.870908590813239e-06, + "loss": 0.9739, + "mean_token_accuracy": 0.7103749692440033, + "num_tokens": 267163665.0, + "step": 106960 + }, + { + "epoch": 0.9807463097093609, + "learning_rate": 3.852571742917393e-06, + "loss": 0.9434, + "mean_token_accuracy": 0.7175757586956024, + "num_tokens": 267191513.0, + "step": 106970 + }, + { + "epoch": 0.9808379939488402, + "learning_rate": 3.8342348950215465e-06, + "loss": 0.9247, + "mean_token_accuracy": 0.7166262805461884, + "num_tokens": 267219257.0, + "step": 106980 + }, + { + "epoch": 0.9809296781883194, + "learning_rate": 3.815898047125699e-06, + "loss": 0.9671, + "mean_token_accuracy": 0.7055789470672608, + "num_tokens": 267247251.0, + "step": 106990 + }, + { + "epoch": 0.9810213624277987, + "learning_rate": 3.7975611992298524e-06, + "loss": 0.942, + "mean_token_accuracy": 0.7121406674385071, + "num_tokens": 267275112.0, + "step": 107000 + }, + { + "epoch": 0.9811130466672779, + "learning_rate": 3.7792243513340055e-06, + "loss": 0.9329, + "mean_token_accuracy": 0.7172952950000763, + "num_tokens": 267302819.0, + "step": 107010 + }, + { + "epoch": 0.9812047309067571, + "learning_rate": 3.760887503438159e-06, + "loss": 0.9454, + "mean_token_accuracy": 0.7095207214355469, + "num_tokens": 267330985.0, + "step": 107020 + }, + { + "epoch": 0.9812964151462363, + "learning_rate": 3.7425506555423122e-06, + "loss": 0.9647, + "mean_token_accuracy": 0.7062365531921386, + "num_tokens": 267358692.0, + "step": 107030 + }, + { + "epoch": 0.9813880993857156, + "learning_rate": 3.7242138076464658e-06, + "loss": 0.982, + "mean_token_accuracy": 0.7057001054286957, + "num_tokens": 267387786.0, + "step": 107040 + }, + { + "epoch": 0.9814797836251948, + "learning_rate": 3.705876959750619e-06, + "loss": 0.9314, + "mean_token_accuracy": 0.7117950439453125, + "num_tokens": 267416620.0, + "step": 107050 + }, + { + "epoch": 0.9815714678646741, + "learning_rate": 3.6875401118547725e-06, + "loss": 0.9199, + "mean_token_accuracy": 0.7160579800605774, + "num_tokens": 267444554.0, + "step": 107060 + }, + { + "epoch": 0.9816631521041533, + "learning_rate": 3.6692032639589256e-06, + "loss": 0.929, + "mean_token_accuracy": 0.7167559683322906, + "num_tokens": 267472585.0, + "step": 107070 + }, + { + "epoch": 0.9817548363436325, + "learning_rate": 3.650866416063079e-06, + "loss": 0.9428, + "mean_token_accuracy": 0.7125068247318268, + "num_tokens": 267499728.0, + "step": 107080 + }, + { + "epoch": 0.9818465205831117, + "learning_rate": 3.6325295681672323e-06, + "loss": 0.9567, + "mean_token_accuracy": 0.7096069157123566, + "num_tokens": 267527845.0, + "step": 107090 + }, + { + "epoch": 0.981938204822591, + "learning_rate": 3.614192720271386e-06, + "loss": 0.9611, + "mean_token_accuracy": 0.7039044857025146, + "num_tokens": 267555763.0, + "step": 107100 + }, + { + "epoch": 0.9820298890620702, + "learning_rate": 3.5958558723755386e-06, + "loss": 0.9461, + "mean_token_accuracy": 0.7165573835372925, + "num_tokens": 267583758.0, + "step": 107110 + }, + { + "epoch": 0.9821215733015495, + "learning_rate": 3.5775190244796917e-06, + "loss": 0.9668, + "mean_token_accuracy": 0.7083516955375672, + "num_tokens": 267611223.0, + "step": 107120 + }, + { + "epoch": 0.9822132575410287, + "learning_rate": 3.5591821765838453e-06, + "loss": 0.9754, + "mean_token_accuracy": 0.7050501585006714, + "num_tokens": 267639537.0, + "step": 107130 + }, + { + "epoch": 0.982304941780508, + "learning_rate": 3.5408453286879984e-06, + "loss": 0.9538, + "mean_token_accuracy": 0.7140101850032806, + "num_tokens": 267667864.0, + "step": 107140 + }, + { + "epoch": 0.9823966260199871, + "learning_rate": 3.522508480792152e-06, + "loss": 0.9497, + "mean_token_accuracy": 0.7126223623752594, + "num_tokens": 267696208.0, + "step": 107150 + }, + { + "epoch": 0.9824883102594664, + "learning_rate": 3.5041716328963056e-06, + "loss": 0.9257, + "mean_token_accuracy": 0.7188680231571197, + "num_tokens": 267723540.0, + "step": 107160 + }, + { + "epoch": 0.9825799944989456, + "learning_rate": 3.4858347850004587e-06, + "loss": 0.9418, + "mean_token_accuracy": 0.7131708323955536, + "num_tokens": 267750849.0, + "step": 107170 + }, + { + "epoch": 0.9826716787384249, + "learning_rate": 3.4674979371046122e-06, + "loss": 0.9241, + "mean_token_accuracy": 0.715410715341568, + "num_tokens": 267778672.0, + "step": 107180 + }, + { + "epoch": 0.9827633629779041, + "learning_rate": 3.4491610892087654e-06, + "loss": 0.9635, + "mean_token_accuracy": 0.7099226772785187, + "num_tokens": 267806503.0, + "step": 107190 + }, + { + "epoch": 0.9828550472173834, + "learning_rate": 3.430824241312919e-06, + "loss": 0.9219, + "mean_token_accuracy": 0.7198168754577636, + "num_tokens": 267833691.0, + "step": 107200 + }, + { + "epoch": 0.9829467314568625, + "learning_rate": 3.4124873934170717e-06, + "loss": 0.9576, + "mean_token_accuracy": 0.7134953022003174, + "num_tokens": 267862815.0, + "step": 107210 + }, + { + "epoch": 0.9830384156963418, + "learning_rate": 3.394150545521225e-06, + "loss": 0.9451, + "mean_token_accuracy": 0.7121977984905243, + "num_tokens": 267891105.0, + "step": 107220 + }, + { + "epoch": 0.983130099935821, + "learning_rate": 3.3758136976253784e-06, + "loss": 0.9592, + "mean_token_accuracy": 0.7109839439392089, + "num_tokens": 267918486.0, + "step": 107230 + }, + { + "epoch": 0.9832217841753003, + "learning_rate": 3.3574768497295315e-06, + "loss": 0.968, + "mean_token_accuracy": 0.7080407559871673, + "num_tokens": 267946117.0, + "step": 107240 + }, + { + "epoch": 0.9833134684147795, + "learning_rate": 3.339140001833685e-06, + "loss": 0.951, + "mean_token_accuracy": 0.7099920630455017, + "num_tokens": 267973868.0, + "step": 107250 + }, + { + "epoch": 0.9834051526542588, + "learning_rate": 3.320803153937838e-06, + "loss": 0.9451, + "mean_token_accuracy": 0.7140229761600494, + "num_tokens": 268002045.0, + "step": 107260 + }, + { + "epoch": 0.983496836893738, + "learning_rate": 3.3024663060419918e-06, + "loss": 0.9356, + "mean_token_accuracy": 0.7128445625305175, + "num_tokens": 268029878.0, + "step": 107270 + }, + { + "epoch": 0.9835885211332172, + "learning_rate": 3.284129458146145e-06, + "loss": 0.9735, + "mean_token_accuracy": 0.7094855904579163, + "num_tokens": 268058681.0, + "step": 107280 + }, + { + "epoch": 0.9836802053726964, + "learning_rate": 3.2657926102502985e-06, + "loss": 0.9508, + "mean_token_accuracy": 0.7092310309410095, + "num_tokens": 268086448.0, + "step": 107290 + }, + { + "epoch": 0.9837718896121757, + "learning_rate": 3.2474557623544516e-06, + "loss": 0.9507, + "mean_token_accuracy": 0.7072018980979919, + "num_tokens": 268115374.0, + "step": 107300 + }, + { + "epoch": 0.9838635738516549, + "learning_rate": 3.2291189144586043e-06, + "loss": 0.9685, + "mean_token_accuracy": 0.7047235190868377, + "num_tokens": 268142870.0, + "step": 107310 + }, + { + "epoch": 0.9839552580911342, + "learning_rate": 3.210782066562758e-06, + "loss": 0.9689, + "mean_token_accuracy": 0.7041001141071319, + "num_tokens": 268168195.0, + "step": 107320 + }, + { + "epoch": 0.9840469423306134, + "learning_rate": 3.192445218666911e-06, + "loss": 0.9562, + "mean_token_accuracy": 0.712040513753891, + "num_tokens": 268195680.0, + "step": 107330 + }, + { + "epoch": 0.9841386265700927, + "learning_rate": 3.1741083707710646e-06, + "loss": 0.9688, + "mean_token_accuracy": 0.7109183728694916, + "num_tokens": 268223300.0, + "step": 107340 + }, + { + "epoch": 0.9842303108095718, + "learning_rate": 3.1557715228752177e-06, + "loss": 0.9466, + "mean_token_accuracy": 0.7137140512466431, + "num_tokens": 268251991.0, + "step": 107350 + }, + { + "epoch": 0.984321995049051, + "learning_rate": 3.1374346749793713e-06, + "loss": 0.9799, + "mean_token_accuracy": 0.7029484987258912, + "num_tokens": 268279720.0, + "step": 107360 + }, + { + "epoch": 0.9844136792885303, + "learning_rate": 3.1190978270835244e-06, + "loss": 0.9707, + "mean_token_accuracy": 0.7057084023952485, + "num_tokens": 268308437.0, + "step": 107370 + }, + { + "epoch": 0.9845053635280095, + "learning_rate": 3.100760979187678e-06, + "loss": 0.926, + "mean_token_accuracy": 0.7118915379047394, + "num_tokens": 268337074.0, + "step": 107380 + }, + { + "epoch": 0.9845970477674888, + "learning_rate": 3.082424131291831e-06, + "loss": 0.981, + "mean_token_accuracy": 0.7060979902744293, + "num_tokens": 268365336.0, + "step": 107390 + }, + { + "epoch": 0.984688732006968, + "learning_rate": 3.0640872833959843e-06, + "loss": 0.9706, + "mean_token_accuracy": 0.7084679424762725, + "num_tokens": 268392832.0, + "step": 107400 + }, + { + "epoch": 0.9847804162464472, + "learning_rate": 3.045750435500138e-06, + "loss": 0.9551, + "mean_token_accuracy": 0.7108550250530243, + "num_tokens": 268420757.0, + "step": 107410 + }, + { + "epoch": 0.9848721004859264, + "learning_rate": 3.027413587604291e-06, + "loss": 0.9593, + "mean_token_accuracy": 0.70405193567276, + "num_tokens": 268448810.0, + "step": 107420 + }, + { + "epoch": 0.9849637847254057, + "learning_rate": 3.0090767397084445e-06, + "loss": 0.9585, + "mean_token_accuracy": 0.7112325847148895, + "num_tokens": 268476505.0, + "step": 107430 + }, + { + "epoch": 0.9850554689648849, + "learning_rate": 2.9907398918125972e-06, + "loss": 0.9498, + "mean_token_accuracy": 0.7112827479839325, + "num_tokens": 268503902.0, + "step": 107440 + }, + { + "epoch": 0.9851471532043642, + "learning_rate": 2.9724030439167508e-06, + "loss": 0.9677, + "mean_token_accuracy": 0.7116233706474304, + "num_tokens": 268531374.0, + "step": 107450 + }, + { + "epoch": 0.9852388374438434, + "learning_rate": 2.9540661960209043e-06, + "loss": 0.9695, + "mean_token_accuracy": 0.7061333119869232, + "num_tokens": 268559105.0, + "step": 107460 + }, + { + "epoch": 0.9853305216833227, + "learning_rate": 2.9357293481250575e-06, + "loss": 0.959, + "mean_token_accuracy": 0.7100592672824859, + "num_tokens": 268586478.0, + "step": 107470 + }, + { + "epoch": 0.9854222059228018, + "learning_rate": 2.917392500229211e-06, + "loss": 0.9365, + "mean_token_accuracy": 0.7193555891513824, + "num_tokens": 268614547.0, + "step": 107480 + }, + { + "epoch": 0.9855138901622811, + "learning_rate": 2.8990556523333638e-06, + "loss": 0.9314, + "mean_token_accuracy": 0.7129702806472779, + "num_tokens": 268643275.0, + "step": 107490 + }, + { + "epoch": 0.9856055744017603, + "learning_rate": 2.8807188044375173e-06, + "loss": 0.9417, + "mean_token_accuracy": 0.7112998008728028, + "num_tokens": 268671856.0, + "step": 107500 + }, + { + "epoch": 0.9856972586412396, + "learning_rate": 2.8623819565416705e-06, + "loss": 0.9339, + "mean_token_accuracy": 0.7164718568325043, + "num_tokens": 268699381.0, + "step": 107510 + }, + { + "epoch": 0.9857889428807188, + "learning_rate": 2.844045108645824e-06, + "loss": 0.9438, + "mean_token_accuracy": 0.7116261959075928, + "num_tokens": 268727217.0, + "step": 107520 + }, + { + "epoch": 0.9858806271201981, + "learning_rate": 2.825708260749977e-06, + "loss": 0.9288, + "mean_token_accuracy": 0.715890783071518, + "num_tokens": 268754171.0, + "step": 107530 + }, + { + "epoch": 0.9859723113596772, + "learning_rate": 2.8073714128541303e-06, + "loss": 0.9608, + "mean_token_accuracy": 0.7092635333538055, + "num_tokens": 268783298.0, + "step": 107540 + }, + { + "epoch": 0.9860639955991565, + "learning_rate": 2.789034564958284e-06, + "loss": 0.9457, + "mean_token_accuracy": 0.7123358964920044, + "num_tokens": 268811658.0, + "step": 107550 + }, + { + "epoch": 0.9861556798386357, + "learning_rate": 2.770697717062437e-06, + "loss": 0.9387, + "mean_token_accuracy": 0.7104895353317261, + "num_tokens": 268839747.0, + "step": 107560 + }, + { + "epoch": 0.986247364078115, + "learning_rate": 2.7523608691665906e-06, + "loss": 0.9708, + "mean_token_accuracy": 0.7031299591064453, + "num_tokens": 268868105.0, + "step": 107570 + }, + { + "epoch": 0.9863390483175942, + "learning_rate": 2.7340240212707437e-06, + "loss": 0.9189, + "mean_token_accuracy": 0.7171532988548279, + "num_tokens": 268896025.0, + "step": 107580 + }, + { + "epoch": 0.9864307325570735, + "learning_rate": 2.715687173374897e-06, + "loss": 0.9343, + "mean_token_accuracy": 0.7195134341716767, + "num_tokens": 268923445.0, + "step": 107590 + }, + { + "epoch": 0.9865224167965527, + "learning_rate": 2.69735032547905e-06, + "loss": 0.9575, + "mean_token_accuracy": 0.7066919088363648, + "num_tokens": 268950796.0, + "step": 107600 + }, + { + "epoch": 0.9866141010360319, + "learning_rate": 2.6790134775832035e-06, + "loss": 0.9166, + "mean_token_accuracy": 0.7156722962856292, + "num_tokens": 268978990.0, + "step": 107610 + }, + { + "epoch": 0.9867057852755111, + "learning_rate": 2.660676629687357e-06, + "loss": 0.9409, + "mean_token_accuracy": 0.7169091105461121, + "num_tokens": 269007019.0, + "step": 107620 + }, + { + "epoch": 0.9867974695149904, + "learning_rate": 2.6423397817915102e-06, + "loss": 0.9657, + "mean_token_accuracy": 0.7096025884151459, + "num_tokens": 269035085.0, + "step": 107630 + }, + { + "epoch": 0.9868891537544696, + "learning_rate": 2.6240029338956634e-06, + "loss": 0.955, + "mean_token_accuracy": 0.7107065618038177, + "num_tokens": 269063429.0, + "step": 107640 + }, + { + "epoch": 0.9869808379939489, + "learning_rate": 2.6056660859998165e-06, + "loss": 0.9836, + "mean_token_accuracy": 0.7031045734882355, + "num_tokens": 269088747.0, + "step": 107650 + }, + { + "epoch": 0.9870725222334281, + "learning_rate": 2.58732923810397e-06, + "loss": 0.9595, + "mean_token_accuracy": 0.7059447705745697, + "num_tokens": 269116551.0, + "step": 107660 + }, + { + "epoch": 0.9871642064729073, + "learning_rate": 2.5689923902081232e-06, + "loss": 0.9283, + "mean_token_accuracy": 0.7176011502742767, + "num_tokens": 269144389.0, + "step": 107670 + }, + { + "epoch": 0.9872558907123865, + "learning_rate": 2.5506555423122768e-06, + "loss": 0.9474, + "mean_token_accuracy": 0.7118645429611206, + "num_tokens": 269172289.0, + "step": 107680 + }, + { + "epoch": 0.9873475749518658, + "learning_rate": 2.53231869441643e-06, + "loss": 0.9482, + "mean_token_accuracy": 0.7113101065158844, + "num_tokens": 269200845.0, + "step": 107690 + }, + { + "epoch": 0.987439259191345, + "learning_rate": 2.513981846520583e-06, + "loss": 0.9556, + "mean_token_accuracy": 0.7083694040775299, + "num_tokens": 269229350.0, + "step": 107700 + }, + { + "epoch": 0.9875309434308243, + "learning_rate": 2.4956449986247366e-06, + "loss": 0.9351, + "mean_token_accuracy": 0.714234220981598, + "num_tokens": 269257317.0, + "step": 107710 + }, + { + "epoch": 0.9876226276703035, + "learning_rate": 2.4773081507288897e-06, + "loss": 0.9331, + "mean_token_accuracy": 0.7184779822826386, + "num_tokens": 269285084.0, + "step": 107720 + }, + { + "epoch": 0.9877143119097828, + "learning_rate": 2.4589713028330433e-06, + "loss": 0.9617, + "mean_token_accuracy": 0.707352077960968, + "num_tokens": 269313336.0, + "step": 107730 + }, + { + "epoch": 0.9878059961492619, + "learning_rate": 2.4406344549371964e-06, + "loss": 0.9859, + "mean_token_accuracy": 0.6971431612968445, + "num_tokens": 269341414.0, + "step": 107740 + }, + { + "epoch": 0.9878976803887412, + "learning_rate": 2.4222976070413496e-06, + "loss": 0.9717, + "mean_token_accuracy": 0.705696564912796, + "num_tokens": 269369551.0, + "step": 107750 + }, + { + "epoch": 0.9879893646282204, + "learning_rate": 2.403960759145503e-06, + "loss": 0.9548, + "mean_token_accuracy": 0.7121150851249695, + "num_tokens": 269396822.0, + "step": 107760 + }, + { + "epoch": 0.9880810488676997, + "learning_rate": 2.3856239112496563e-06, + "loss": 0.9632, + "mean_token_accuracy": 0.7125303685665131, + "num_tokens": 269424623.0, + "step": 107770 + }, + { + "epoch": 0.9881727331071789, + "learning_rate": 2.36728706335381e-06, + "loss": 0.9601, + "mean_token_accuracy": 0.7132599592208863, + "num_tokens": 269452041.0, + "step": 107780 + }, + { + "epoch": 0.9882644173466582, + "learning_rate": 2.348950215457963e-06, + "loss": 0.9479, + "mean_token_accuracy": 0.7090761542320252, + "num_tokens": 269477961.0, + "step": 107790 + }, + { + "epoch": 0.9883561015861373, + "learning_rate": 2.330613367562116e-06, + "loss": 0.9456, + "mean_token_accuracy": 0.708621370792389, + "num_tokens": 269504979.0, + "step": 107800 + }, + { + "epoch": 0.9884477858256165, + "learning_rate": 2.3122765196662693e-06, + "loss": 0.9555, + "mean_token_accuracy": 0.7117623150348663, + "num_tokens": 269533066.0, + "step": 107810 + }, + { + "epoch": 0.9885394700650958, + "learning_rate": 2.293939671770423e-06, + "loss": 0.9595, + "mean_token_accuracy": 0.710222738981247, + "num_tokens": 269560809.0, + "step": 107820 + }, + { + "epoch": 0.988631154304575, + "learning_rate": 2.275602823874576e-06, + "loss": 0.952, + "mean_token_accuracy": 0.7048126757144928, + "num_tokens": 269589536.0, + "step": 107830 + }, + { + "epoch": 0.9887228385440543, + "learning_rate": 2.2572659759787295e-06, + "loss": 0.9393, + "mean_token_accuracy": 0.711496913433075, + "num_tokens": 269618091.0, + "step": 107840 + }, + { + "epoch": 0.9888145227835335, + "learning_rate": 2.2389291280828827e-06, + "loss": 0.9684, + "mean_token_accuracy": 0.706806880235672, + "num_tokens": 269646262.0, + "step": 107850 + }, + { + "epoch": 0.9889062070230128, + "learning_rate": 2.220592280187036e-06, + "loss": 0.9522, + "mean_token_accuracy": 0.7087924242019653, + "num_tokens": 269674407.0, + "step": 107860 + }, + { + "epoch": 0.9889978912624919, + "learning_rate": 2.2022554322911894e-06, + "loss": 0.9667, + "mean_token_accuracy": 0.7084844768047333, + "num_tokens": 269703500.0, + "step": 107870 + }, + { + "epoch": 0.9890895755019712, + "learning_rate": 2.1839185843953425e-06, + "loss": 0.933, + "mean_token_accuracy": 0.7124791145324707, + "num_tokens": 269730973.0, + "step": 107880 + }, + { + "epoch": 0.9891812597414504, + "learning_rate": 2.165581736499496e-06, + "loss": 0.9329, + "mean_token_accuracy": 0.7177101850509644, + "num_tokens": 269759446.0, + "step": 107890 + }, + { + "epoch": 0.9892729439809297, + "learning_rate": 2.147244888603649e-06, + "loss": 0.948, + "mean_token_accuracy": 0.7117880403995513, + "num_tokens": 269787020.0, + "step": 107900 + }, + { + "epoch": 0.9893646282204089, + "learning_rate": 2.1289080407078023e-06, + "loss": 0.9597, + "mean_token_accuracy": 0.7092513144016266, + "num_tokens": 269814669.0, + "step": 107910 + }, + { + "epoch": 0.9894563124598882, + "learning_rate": 2.110571192811956e-06, + "loss": 0.9611, + "mean_token_accuracy": 0.7070608317852021, + "num_tokens": 269842618.0, + "step": 107920 + }, + { + "epoch": 0.9895479966993673, + "learning_rate": 2.092234344916109e-06, + "loss": 0.9428, + "mean_token_accuracy": 0.714831417798996, + "num_tokens": 269871870.0, + "step": 107930 + }, + { + "epoch": 0.9896396809388466, + "learning_rate": 2.0738974970202626e-06, + "loss": 0.9395, + "mean_token_accuracy": 0.7137292504310608, + "num_tokens": 269899786.0, + "step": 107940 + }, + { + "epoch": 0.9897313651783258, + "learning_rate": 2.0555606491244153e-06, + "loss": 0.933, + "mean_token_accuracy": 0.7155964374542236, + "num_tokens": 269927187.0, + "step": 107950 + }, + { + "epoch": 0.9898230494178051, + "learning_rate": 2.037223801228569e-06, + "loss": 0.9082, + "mean_token_accuracy": 0.7195849716663361, + "num_tokens": 269955587.0, + "step": 107960 + }, + { + "epoch": 0.9899147336572843, + "learning_rate": 2.018886953332722e-06, + "loss": 0.9385, + "mean_token_accuracy": 0.7136310696601867, + "num_tokens": 269982937.0, + "step": 107970 + }, + { + "epoch": 0.9900064178967636, + "learning_rate": 2.0005501054368756e-06, + "loss": 0.9442, + "mean_token_accuracy": 0.7146109282970429, + "num_tokens": 270010417.0, + "step": 107980 + }, + { + "epoch": 0.9900981021362428, + "learning_rate": 1.9822132575410287e-06, + "loss": 0.9608, + "mean_token_accuracy": 0.7055068433284759, + "num_tokens": 270038197.0, + "step": 107990 + }, + { + "epoch": 0.990189786375722, + "learning_rate": 1.963876409645182e-06, + "loss": 0.9737, + "mean_token_accuracy": 0.7058661997318267, + "num_tokens": 270066540.0, + "step": 108000 + }, + { + "epoch": 0.9902814706152012, + "learning_rate": 1.9455395617493354e-06, + "loss": 0.9617, + "mean_token_accuracy": 0.7059551119804383, + "num_tokens": 270094791.0, + "step": 108010 + }, + { + "epoch": 0.9903731548546805, + "learning_rate": 1.9272027138534885e-06, + "loss": 0.9634, + "mean_token_accuracy": 0.7042786717414856, + "num_tokens": 270123404.0, + "step": 108020 + }, + { + "epoch": 0.9904648390941597, + "learning_rate": 1.908865865957642e-06, + "loss": 0.9701, + "mean_token_accuracy": 0.7064362466335297, + "num_tokens": 270151470.0, + "step": 108030 + }, + { + "epoch": 0.990556523333639, + "learning_rate": 1.8905290180617955e-06, + "loss": 0.9676, + "mean_token_accuracy": 0.7073017716407776, + "num_tokens": 270179636.0, + "step": 108040 + }, + { + "epoch": 0.9906482075731182, + "learning_rate": 1.8721921701659488e-06, + "loss": 0.9514, + "mean_token_accuracy": 0.7094836533069611, + "num_tokens": 270207493.0, + "step": 108050 + }, + { + "epoch": 0.9907398918125974, + "learning_rate": 1.8538553222701017e-06, + "loss": 0.9347, + "mean_token_accuracy": 0.7093855202198028, + "num_tokens": 270235131.0, + "step": 108060 + }, + { + "epoch": 0.9908315760520766, + "learning_rate": 1.835518474374255e-06, + "loss": 0.9652, + "mean_token_accuracy": 0.7078740477561951, + "num_tokens": 270263598.0, + "step": 108070 + }, + { + "epoch": 0.9909232602915559, + "learning_rate": 1.8171816264784084e-06, + "loss": 0.9318, + "mean_token_accuracy": 0.7160435378551483, + "num_tokens": 270291199.0, + "step": 108080 + }, + { + "epoch": 0.9910149445310351, + "learning_rate": 1.7988447785825618e-06, + "loss": 0.9584, + "mean_token_accuracy": 0.7111521482467651, + "num_tokens": 270318981.0, + "step": 108090 + }, + { + "epoch": 0.9911066287705144, + "learning_rate": 1.7805079306867151e-06, + "loss": 0.9377, + "mean_token_accuracy": 0.7162557542324066, + "num_tokens": 270347137.0, + "step": 108100 + }, + { + "epoch": 0.9911983130099936, + "learning_rate": 1.7621710827908683e-06, + "loss": 0.9648, + "mean_token_accuracy": 0.7065443277359009, + "num_tokens": 270374958.0, + "step": 108110 + }, + { + "epoch": 0.9912899972494729, + "learning_rate": 1.7438342348950216e-06, + "loss": 0.9354, + "mean_token_accuracy": 0.7149212837219239, + "num_tokens": 270404129.0, + "step": 108120 + }, + { + "epoch": 0.991381681488952, + "learning_rate": 1.725497386999175e-06, + "loss": 0.9375, + "mean_token_accuracy": 0.7164669811725617, + "num_tokens": 270432238.0, + "step": 108130 + }, + { + "epoch": 0.9914733657284313, + "learning_rate": 1.7071605391033283e-06, + "loss": 0.968, + "mean_token_accuracy": 0.7033616840839386, + "num_tokens": 270461170.0, + "step": 108140 + }, + { + "epoch": 0.9915650499679105, + "learning_rate": 1.6888236912074817e-06, + "loss": 0.9381, + "mean_token_accuracy": 0.7152381062507629, + "num_tokens": 270488544.0, + "step": 108150 + }, + { + "epoch": 0.9916567342073898, + "learning_rate": 1.6704868433116346e-06, + "loss": 0.9797, + "mean_token_accuracy": 0.7032285392284393, + "num_tokens": 270515714.0, + "step": 108160 + }, + { + "epoch": 0.991748418446869, + "learning_rate": 1.652149995415788e-06, + "loss": 0.9434, + "mean_token_accuracy": 0.71032155752182, + "num_tokens": 270543296.0, + "step": 108170 + }, + { + "epoch": 0.9918401026863483, + "learning_rate": 1.6338131475199415e-06, + "loss": 0.9267, + "mean_token_accuracy": 0.7193844795227051, + "num_tokens": 270571215.0, + "step": 108180 + }, + { + "epoch": 0.9919317869258274, + "learning_rate": 1.6154762996240949e-06, + "loss": 0.9513, + "mean_token_accuracy": 0.7087843775749206, + "num_tokens": 270599346.0, + "step": 108190 + }, + { + "epoch": 0.9920234711653066, + "learning_rate": 1.5971394517282482e-06, + "loss": 0.9619, + "mean_token_accuracy": 0.7091204702854157, + "num_tokens": 270627760.0, + "step": 108200 + }, + { + "epoch": 0.9921151554047859, + "learning_rate": 1.5788026038324011e-06, + "loss": 0.9077, + "mean_token_accuracy": 0.7241861045360565, + "num_tokens": 270655493.0, + "step": 108210 + }, + { + "epoch": 0.9922068396442651, + "learning_rate": 1.5604657559365545e-06, + "loss": 0.9518, + "mean_token_accuracy": 0.7072457790374755, + "num_tokens": 270683485.0, + "step": 108220 + }, + { + "epoch": 0.9922985238837444, + "learning_rate": 1.5421289080407078e-06, + "loss": 0.9406, + "mean_token_accuracy": 0.7132770359516144, + "num_tokens": 270711649.0, + "step": 108230 + }, + { + "epoch": 0.9923902081232236, + "learning_rate": 1.5237920601448612e-06, + "loss": 0.9824, + "mean_token_accuracy": 0.7037883758544922, + "num_tokens": 270739935.0, + "step": 108240 + }, + { + "epoch": 0.9924818923627029, + "learning_rate": 1.5054552122490145e-06, + "loss": 0.9676, + "mean_token_accuracy": 0.7086636006832123, + "num_tokens": 270768643.0, + "step": 108250 + }, + { + "epoch": 0.992573576602182, + "learning_rate": 1.4871183643531679e-06, + "loss": 0.9596, + "mean_token_accuracy": 0.7082400918006897, + "num_tokens": 270796222.0, + "step": 108260 + }, + { + "epoch": 0.9926652608416613, + "learning_rate": 1.468781516457321e-06, + "loss": 0.9236, + "mean_token_accuracy": 0.7113487184047699, + "num_tokens": 270824348.0, + "step": 108270 + }, + { + "epoch": 0.9927569450811405, + "learning_rate": 1.4504446685614744e-06, + "loss": 0.9335, + "mean_token_accuracy": 0.7143835961818695, + "num_tokens": 270851632.0, + "step": 108280 + }, + { + "epoch": 0.9928486293206198, + "learning_rate": 1.4321078206656277e-06, + "loss": 0.9691, + "mean_token_accuracy": 0.7031129777431488, + "num_tokens": 270879073.0, + "step": 108290 + }, + { + "epoch": 0.992940313560099, + "learning_rate": 1.4137709727697809e-06, + "loss": 0.9621, + "mean_token_accuracy": 0.70713369846344, + "num_tokens": 270907964.0, + "step": 108300 + }, + { + "epoch": 0.9930319977995783, + "learning_rate": 1.3954341248739342e-06, + "loss": 0.9544, + "mean_token_accuracy": 0.7095125436782836, + "num_tokens": 270936402.0, + "step": 108310 + }, + { + "epoch": 0.9931236820390574, + "learning_rate": 1.3770972769780873e-06, + "loss": 0.9407, + "mean_token_accuracy": 0.7117841303348541, + "num_tokens": 270964626.0, + "step": 108320 + }, + { + "epoch": 0.9932153662785367, + "learning_rate": 1.358760429082241e-06, + "loss": 0.9675, + "mean_token_accuracy": 0.7025663137435914, + "num_tokens": 270993097.0, + "step": 108330 + }, + { + "epoch": 0.9933070505180159, + "learning_rate": 1.3404235811863943e-06, + "loss": 0.9263, + "mean_token_accuracy": 0.7160776257514954, + "num_tokens": 271021091.0, + "step": 108340 + }, + { + "epoch": 0.9933987347574952, + "learning_rate": 1.3220867332905474e-06, + "loss": 0.9456, + "mean_token_accuracy": 0.7149143099784852, + "num_tokens": 271048572.0, + "step": 108350 + }, + { + "epoch": 0.9934904189969744, + "learning_rate": 1.3037498853947007e-06, + "loss": 0.9721, + "mean_token_accuracy": 0.7054606318473816, + "num_tokens": 271075801.0, + "step": 108360 + }, + { + "epoch": 0.9935821032364537, + "learning_rate": 1.285413037498854e-06, + "loss": 0.9746, + "mean_token_accuracy": 0.707843953371048, + "num_tokens": 271103833.0, + "step": 108370 + }, + { + "epoch": 0.9936737874759329, + "learning_rate": 1.2670761896030072e-06, + "loss": 0.9489, + "mean_token_accuracy": 0.7131265759468078, + "num_tokens": 271130967.0, + "step": 108380 + }, + { + "epoch": 0.9937654717154121, + "learning_rate": 1.2487393417071606e-06, + "loss": 0.974, + "mean_token_accuracy": 0.7050150334835052, + "num_tokens": 271158191.0, + "step": 108390 + }, + { + "epoch": 0.9938571559548913, + "learning_rate": 1.230402493811314e-06, + "loss": 0.9432, + "mean_token_accuracy": 0.710757851600647, + "num_tokens": 271185860.0, + "step": 108400 + }, + { + "epoch": 0.9939488401943706, + "learning_rate": 1.2120656459154673e-06, + "loss": 0.9674, + "mean_token_accuracy": 0.7087086319923401, + "num_tokens": 271214253.0, + "step": 108410 + }, + { + "epoch": 0.9940405244338498, + "learning_rate": 1.1937287980196206e-06, + "loss": 0.9621, + "mean_token_accuracy": 0.7093576073646546, + "num_tokens": 271242404.0, + "step": 108420 + }, + { + "epoch": 0.9941322086733291, + "learning_rate": 1.1753919501237738e-06, + "loss": 0.9294, + "mean_token_accuracy": 0.7140588998794556, + "num_tokens": 271269773.0, + "step": 108430 + }, + { + "epoch": 0.9942238929128083, + "learning_rate": 1.1570551022279271e-06, + "loss": 1.0008, + "mean_token_accuracy": 0.7005892097949982, + "num_tokens": 271298028.0, + "step": 108440 + }, + { + "epoch": 0.9943155771522875, + "learning_rate": 1.1387182543320803e-06, + "loss": 0.92, + "mean_token_accuracy": 0.7150518417358398, + "num_tokens": 271325650.0, + "step": 108450 + }, + { + "epoch": 0.9944072613917667, + "learning_rate": 1.1203814064362336e-06, + "loss": 0.9756, + "mean_token_accuracy": 0.7039842367172241, + "num_tokens": 271354299.0, + "step": 108460 + }, + { + "epoch": 0.994498945631246, + "learning_rate": 1.102044558540387e-06, + "loss": 0.9615, + "mean_token_accuracy": 0.706362110376358, + "num_tokens": 271382096.0, + "step": 108470 + }, + { + "epoch": 0.9945906298707252, + "learning_rate": 1.0837077106445403e-06, + "loss": 0.953, + "mean_token_accuracy": 0.7117473840713501, + "num_tokens": 271410248.0, + "step": 108480 + }, + { + "epoch": 0.9946823141102045, + "learning_rate": 1.0653708627486937e-06, + "loss": 0.9504, + "mean_token_accuracy": 0.7121224582195282, + "num_tokens": 271438094.0, + "step": 108490 + }, + { + "epoch": 0.9947739983496837, + "learning_rate": 1.0470340148528468e-06, + "loss": 0.9419, + "mean_token_accuracy": 0.7153161048889161, + "num_tokens": 271466215.0, + "step": 108500 + }, + { + "epoch": 0.994865682589163, + "learning_rate": 1.0286971669570001e-06, + "loss": 0.9281, + "mean_token_accuracy": 0.7177415311336517, + "num_tokens": 271494690.0, + "step": 108510 + }, + { + "epoch": 0.9949573668286421, + "learning_rate": 1.0103603190611535e-06, + "loss": 0.9482, + "mean_token_accuracy": 0.7120618402957917, + "num_tokens": 271523304.0, + "step": 108520 + }, + { + "epoch": 0.9950490510681214, + "learning_rate": 9.920234711653066e-07, + "loss": 0.9501, + "mean_token_accuracy": 0.7138809025287628, + "num_tokens": 271552187.0, + "step": 108530 + }, + { + "epoch": 0.9951407353076006, + "learning_rate": 9.7368662326946e-07, + "loss": 0.9444, + "mean_token_accuracy": 0.7139100313186646, + "num_tokens": 271580179.0, + "step": 108540 + }, + { + "epoch": 0.9952324195470799, + "learning_rate": 9.553497753736133e-07, + "loss": 0.9949, + "mean_token_accuracy": 0.6991130471229553, + "num_tokens": 271605081.0, + "step": 108550 + }, + { + "epoch": 0.9953241037865591, + "learning_rate": 9.370129274777666e-07, + "loss": 0.9518, + "mean_token_accuracy": 0.7130214869976044, + "num_tokens": 271633152.0, + "step": 108560 + }, + { + "epoch": 0.9954157880260384, + "learning_rate": 9.186760795819199e-07, + "loss": 0.9566, + "mean_token_accuracy": 0.7135081589221954, + "num_tokens": 271660525.0, + "step": 108570 + }, + { + "epoch": 0.9955074722655176, + "learning_rate": 9.003392316860732e-07, + "loss": 0.9443, + "mean_token_accuracy": 0.7129908621311187, + "num_tokens": 271688678.0, + "step": 108580 + }, + { + "epoch": 0.9955991565049968, + "learning_rate": 8.820023837902265e-07, + "loss": 0.9484, + "mean_token_accuracy": 0.711221432685852, + "num_tokens": 271716407.0, + "step": 108590 + }, + { + "epoch": 0.995690840744476, + "learning_rate": 8.636655358943799e-07, + "loss": 0.9509, + "mean_token_accuracy": 0.7100203394889831, + "num_tokens": 271743725.0, + "step": 108600 + }, + { + "epoch": 0.9957825249839553, + "learning_rate": 8.45328687998533e-07, + "loss": 0.9633, + "mean_token_accuracy": 0.706583422422409, + "num_tokens": 271772720.0, + "step": 108610 + }, + { + "epoch": 0.9958742092234345, + "learning_rate": 8.269918401026865e-07, + "loss": 0.9531, + "mean_token_accuracy": 0.713868010044098, + "num_tokens": 271800659.0, + "step": 108620 + }, + { + "epoch": 0.9959658934629138, + "learning_rate": 8.086549922068396e-07, + "loss": 0.9472, + "mean_token_accuracy": 0.7135761678218842, + "num_tokens": 271829073.0, + "step": 108630 + }, + { + "epoch": 0.996057577702393, + "learning_rate": 7.90318144310993e-07, + "loss": 0.9296, + "mean_token_accuracy": 0.7176508367061615, + "num_tokens": 271857684.0, + "step": 108640 + }, + { + "epoch": 0.9961492619418721, + "learning_rate": 7.719812964151463e-07, + "loss": 0.9427, + "mean_token_accuracy": 0.7142350792884826, + "num_tokens": 271885236.0, + "step": 108650 + }, + { + "epoch": 0.9962409461813514, + "learning_rate": 7.536444485192995e-07, + "loss": 0.9592, + "mean_token_accuracy": 0.7084473371505737, + "num_tokens": 271913274.0, + "step": 108660 + }, + { + "epoch": 0.9963326304208306, + "learning_rate": 7.353076006234529e-07, + "loss": 0.9529, + "mean_token_accuracy": 0.7091939210891723, + "num_tokens": 271940681.0, + "step": 108670 + }, + { + "epoch": 0.9964243146603099, + "learning_rate": 7.169707527276061e-07, + "loss": 0.9558, + "mean_token_accuracy": 0.7062992513179779, + "num_tokens": 271968803.0, + "step": 108680 + }, + { + "epoch": 0.9965159988997891, + "learning_rate": 6.986339048317595e-07, + "loss": 0.9429, + "mean_token_accuracy": 0.7165329098701477, + "num_tokens": 271996730.0, + "step": 108690 + }, + { + "epoch": 0.9966076831392684, + "learning_rate": 6.802970569359127e-07, + "loss": 0.9452, + "mean_token_accuracy": 0.7138762652873993, + "num_tokens": 272024490.0, + "step": 108700 + }, + { + "epoch": 0.9966993673787476, + "learning_rate": 6.619602090400661e-07, + "loss": 0.9569, + "mean_token_accuracy": 0.7109337151050568, + "num_tokens": 272050972.0, + "step": 108710 + }, + { + "epoch": 0.9967910516182268, + "learning_rate": 6.436233611442193e-07, + "loss": 0.9528, + "mean_token_accuracy": 0.7097187757492065, + "num_tokens": 272078689.0, + "step": 108720 + }, + { + "epoch": 0.996882735857706, + "learning_rate": 6.252865132483727e-07, + "loss": 0.9488, + "mean_token_accuracy": 0.710624486207962, + "num_tokens": 272106417.0, + "step": 108730 + }, + { + "epoch": 0.9969744200971853, + "learning_rate": 6.069496653525259e-07, + "loss": 0.9253, + "mean_token_accuracy": 0.7121653497219086, + "num_tokens": 272134030.0, + "step": 108740 + }, + { + "epoch": 0.9970661043366645, + "learning_rate": 5.886128174566792e-07, + "loss": 0.9305, + "mean_token_accuracy": 0.7163199841976166, + "num_tokens": 272161855.0, + "step": 108750 + }, + { + "epoch": 0.9971577885761438, + "learning_rate": 5.702759695608325e-07, + "loss": 0.953, + "mean_token_accuracy": 0.7092844486236572, + "num_tokens": 272189414.0, + "step": 108760 + }, + { + "epoch": 0.997249472815623, + "learning_rate": 5.519391216649859e-07, + "loss": 0.9543, + "mean_token_accuracy": 0.7108266532421113, + "num_tokens": 272217548.0, + "step": 108770 + }, + { + "epoch": 0.9973411570551022, + "learning_rate": 5.336022737691391e-07, + "loss": 0.9519, + "mean_token_accuracy": 0.71286461353302, + "num_tokens": 272245748.0, + "step": 108780 + }, + { + "epoch": 0.9974328412945814, + "learning_rate": 5.152654258732924e-07, + "loss": 0.9713, + "mean_token_accuracy": 0.7049710333347321, + "num_tokens": 272273014.0, + "step": 108790 + }, + { + "epoch": 0.9975245255340607, + "learning_rate": 4.969285779774457e-07, + "loss": 0.9808, + "mean_token_accuracy": 0.7022957563400268, + "num_tokens": 272301065.0, + "step": 108800 + }, + { + "epoch": 0.9976162097735399, + "learning_rate": 4.785917300815991e-07, + "loss": 0.9772, + "mean_token_accuracy": 0.7063236474990845, + "num_tokens": 272328845.0, + "step": 108810 + }, + { + "epoch": 0.9977078940130192, + "learning_rate": 4.602548821857523e-07, + "loss": 0.946, + "mean_token_accuracy": 0.7124539732933044, + "num_tokens": 272356524.0, + "step": 108820 + }, + { + "epoch": 0.9977995782524984, + "learning_rate": 4.419180342899056e-07, + "loss": 0.9525, + "mean_token_accuracy": 0.7134114861488342, + "num_tokens": 272384910.0, + "step": 108830 + }, + { + "epoch": 0.9978912624919777, + "learning_rate": 4.2358118639405884e-07, + "loss": 0.9209, + "mean_token_accuracy": 0.7175331294536591, + "num_tokens": 272413154.0, + "step": 108840 + }, + { + "epoch": 0.9979829467314568, + "learning_rate": 4.052443384982122e-07, + "loss": 0.963, + "mean_token_accuracy": 0.7068632543087006, + "num_tokens": 272441661.0, + "step": 108850 + }, + { + "epoch": 0.9980746309709361, + "learning_rate": 3.869074906023655e-07, + "loss": 0.9593, + "mean_token_accuracy": 0.7033331573009491, + "num_tokens": 272470052.0, + "step": 108860 + }, + { + "epoch": 0.9981663152104153, + "learning_rate": 3.685706427065188e-07, + "loss": 0.969, + "mean_token_accuracy": 0.7020613729953766, + "num_tokens": 272498173.0, + "step": 108870 + }, + { + "epoch": 0.9982579994498946, + "learning_rate": 3.502337948106721e-07, + "loss": 0.9765, + "mean_token_accuracy": 0.7058265626430511, + "num_tokens": 272526028.0, + "step": 108880 + }, + { + "epoch": 0.9983496836893738, + "learning_rate": 3.318969469148254e-07, + "loss": 0.927, + "mean_token_accuracy": 0.7112305581569671, + "num_tokens": 272554507.0, + "step": 108890 + }, + { + "epoch": 0.9984413679288531, + "learning_rate": 3.135600990189786e-07, + "loss": 0.9531, + "mean_token_accuracy": 0.7085698962211608, + "num_tokens": 272583042.0, + "step": 108900 + }, + { + "epoch": 0.9985330521683322, + "learning_rate": 2.9522325112313197e-07, + "loss": 0.951, + "mean_token_accuracy": 0.7063367486000061, + "num_tokens": 272610733.0, + "step": 108910 + }, + { + "epoch": 0.9986247364078115, + "learning_rate": 2.768864032272852e-07, + "loss": 0.9817, + "mean_token_accuracy": 0.705414742231369, + "num_tokens": 272638792.0, + "step": 108920 + }, + { + "epoch": 0.9987164206472907, + "learning_rate": 2.5854955533143856e-07, + "loss": 0.9997, + "mean_token_accuracy": 0.7029419541358948, + "num_tokens": 272666918.0, + "step": 108930 + }, + { + "epoch": 0.99880810488677, + "learning_rate": 2.402127074355918e-07, + "loss": 0.9656, + "mean_token_accuracy": 0.7078922510147094, + "num_tokens": 272694387.0, + "step": 108940 + }, + { + "epoch": 0.9988997891262492, + "learning_rate": 2.2187585953974516e-07, + "loss": 0.9329, + "mean_token_accuracy": 0.7136320233345032, + "num_tokens": 272720667.0, + "step": 108950 + }, + { + "epoch": 0.9989914733657285, + "learning_rate": 2.0353901164389843e-07, + "loss": 0.9608, + "mean_token_accuracy": 0.7071583569049835, + "num_tokens": 272748319.0, + "step": 108960 + }, + { + "epoch": 0.9990831576052077, + "learning_rate": 1.8520216374805172e-07, + "loss": 0.966, + "mean_token_accuracy": 0.7109744012355804, + "num_tokens": 272776982.0, + "step": 108970 + }, + { + "epoch": 0.9991748418446869, + "learning_rate": 1.6686531585220502e-07, + "loss": 0.9342, + "mean_token_accuracy": 0.7147205471992493, + "num_tokens": 272804956.0, + "step": 108980 + }, + { + "epoch": 0.9992665260841661, + "learning_rate": 1.4852846795635832e-07, + "loss": 0.9635, + "mean_token_accuracy": 0.7084476709365845, + "num_tokens": 272833433.0, + "step": 108990 + }, + { + "epoch": 0.9993582103236454, + "learning_rate": 1.3019162006051161e-07, + "loss": 0.9791, + "mean_token_accuracy": 0.7073094964027404, + "num_tokens": 272861260.0, + "step": 109000 + }, + { + "epoch": 0.9994498945631246, + "learning_rate": 1.1185477216466491e-07, + "loss": 0.9614, + "mean_token_accuracy": 0.7112366139888764, + "num_tokens": 272889446.0, + "step": 109010 + }, + { + "epoch": 0.9995415788026039, + "learning_rate": 9.35179242688182e-08, + "loss": 0.9253, + "mean_token_accuracy": 0.7157534658908844, + "num_tokens": 272917134.0, + "step": 109020 + }, + { + "epoch": 0.9996332630420831, + "learning_rate": 7.518107637297149e-08, + "loss": 0.9747, + "mean_token_accuracy": 0.7045438110828399, + "num_tokens": 272945009.0, + "step": 109030 + }, + { + "epoch": 0.9997249472815622, + "learning_rate": 5.684422847712479e-08, + "loss": 0.9436, + "mean_token_accuracy": 0.7104832291603088, + "num_tokens": 272973145.0, + "step": 109040 + }, + { + "epoch": 0.9998166315210415, + "learning_rate": 3.8507380581278085e-08, + "loss": 0.9714, + "mean_token_accuracy": 0.7046187996864319, + "num_tokens": 273000995.0, + "step": 109050 + }, + { + "epoch": 1.0000366736957917, + "learning_rate": 2.0170532685431375e-08, + "loss": 0.9708, + "mean_token_accuracy": 0.705879271030426, + "num_tokens": 273021976.0, + "step": 109060 + }, + { + "epoch": 1.0001283579352709, + "learning_rate": 1.8336847895846704e-09, + "loss": 0.9834, + "mean_token_accuracy": 0.7151719331741333, + "num_tokens": 273045815.0, + "step": 109070 + } + ], + "logging_steps": 10, + "max_steps": 109070, + "num_input_tokens_seen": 0, + "num_train_epochs": 9223372036854775807, + "save_steps": 6816, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 1.7755502837531136e+19, + "train_batch_size": 8, + "trial_name": null, + "trial_params": null +}